Update app.py
Browse files
app.py
CHANGED
@@ -290,16 +290,7 @@ def invoke (prompt, history, rag_option, openai_api_key, temperature=0.9, max_n
|
|
290 |
#oder an Hugging Face
|
291 |
#llm = HuggingFaceHub(repo_id=repo_id, model_kwargs={"temperature": 0.5, "max_length": 64})
|
292 |
#llm = HuggingFaceHub(url_??? = "https://wdgsjd6zf201mufn.us-east-1.aws.endpoints.huggingface.cloud", model_kwargs={"temperature": 0.5, "max_length": 64})
|
293 |
-
llm = HuggingFaceTextGenInference(
|
294 |
-
inference_server_url="https://wdgsjd6zf201mufn.us-east-1.aws.endpoints.huggingface.cloud", #"http://localhost:8010/",
|
295 |
-
user = "Bearer hf_********************************",  # SECURITY: a real HF API token was committed here in plain text — revoke it immediately and load it from an environment variable (e.g. os.environ["HF_API_TOKEN"]) instead
|
296 |
-
max_new_tokens=max_new_tokens,
|
297 |
-
top_k=10,
|
298 |
-
top_p=top_p,
|
299 |
-
typical_p=0.95,
|
300 |
-
temperature=temperature,
|
301 |
-
repetition_penalty=repetition_penalty,
|
302 |
-
)
|
303 |
|
304 |
#zusätzliche Dokumenten Splits aus DB zum Prompt hinzufügen (aus VektorDB - Chroma oder Mongo DB)
|
305 |
if (rag_option == "An"):
|
|
|
290 |
#oder an Hugging Face
|
291 |
#llm = HuggingFaceHub(repo_id=repo_id, model_kwargs={"temperature": 0.5, "max_length": 64})
|
292 |
#llm = HuggingFaceHub(url_??? = "https://wdgsjd6zf201mufn.us-east-1.aws.endpoints.huggingface.cloud", model_kwargs={"temperature": 0.5, "max_length": 64})
|
293 |
+
#llm = HuggingFaceTextGenInference( inference_server_url="http://localhost:8010/", max_new_tokens=max_new_tokens,top_k=10,top_p=top_p,typical_p=0.95,temperature=temperature,repetition_penalty=repetition_penalty,)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
294 |
|
295 |
#zusätzliche Dokumenten Splits aus DB zum Prompt hinzufügen (aus VektorDB - Chroma oder Mongo DB)
|
296 |
if (rag_option == "An"):
|