lukestanley committed
Commit 52fc709 · 1 Parent(s): c4d55d5

Fix: when using http worker, only download if inference is on localhost

Files changed (1)
1. utils.py +1 -1
utils.py CHANGED
@@ -36,7 +36,7 @@ LLM_MODEL_PATH = env.get("LLM_MODEL_PATH", None)
 MAX_TOKENS = int(env.get("MAX_TOKENS", 1000))
 TEMPERATURE = float(env.get("TEMPERATURE", 0.3))
 
-performing_local_inference = (LLM_WORKER == "in_memory" or LLM_WORKER == "http")
+performing_local_inference = (LLM_WORKER == "in_memory" or (LLM_WORKER == "http" and "localhost" in URL))
 
 if LLM_MODEL_PATH and len(LLM_MODEL_PATH) > 0:
     print(f"Using local model from {LLM_MODEL_PATH}")