search-assistant-maqal

Paused

App Files Community

arabellastrange committed on Jul 29, 2024

Commit

65fa153

1 Parent(s): 3b97df8

backup offline search

Browse files

Files changed (2) hide show

app.py +42 -12
read_write_index.py +1 -2

app.py CHANGED Viewed

@@ -7,11 +7,30 @@ from llama_index.core import Document, VectorStoreIndex
 from generate_response import generate_chat_response_with_history, set_llm, is_search_query, condense_question, \
     generate_chat_response_with_history_rag_return_response
 from web_search import search
 API_KEY_PATH = "../keys/gpt_api_key.txt"
 logger = logging.getLogger("agent_logger")
 def google_search_chat(message, history):
     condensed_question = condense_question(message, history)
@@ -29,21 +48,32 @@ def google_search_chat(message, history):
             index = VectorStoreIndex.from_documents(documents)
             print('Search results vectorized...')
             response = generate_chat_response_with_history_rag_return_response(index, message, history)
-            response_text = []
-            string_output = ""
-            for text in response.response_gen:
-                response_text.append(text)
-                string_output = ''.join(response_text)
-                yield string_output
-            yield string_output + f'\n\n --- \n **Sources used:** \n {sources}'
-            print(f'Assistant Response: {string_output}')
-        else:
-            print(
-                f'Assistant Response: Sorry, no search results found.')
-            yield "Sorry, no search results found."
     else:
         yield from generate_chat_response_with_history(message, history)

 from generate_response import generate_chat_response_with_history, set_llm, is_search_query, condense_question, \
     generate_chat_response_with_history_rag_return_response
+from read_write_index import read_write_index
 from web_search import search
 API_KEY_PATH = "../keys/gpt_api_key.txt"
 logger = logging.getLogger("agent_logger")
+mush_sources = ("1. https://en.wikipedia.org/wiki/Mushroom_poisoning \n"
+                "2. https://thehomesteadtraveler.com/foraging-for-mushrooms-in-italy/ \n"
+                "3. https://funghimagazine.it/mushroom-hunting-in-italy/")
+email_sources = (
+    "1. https://support.microsoft.com/en-us/office/advanced-outlook-com-security-for-microsoft-365-subscribers-882d2243-eab9-4545-a58a-b36fee4a46e2"
+    "\n 2. https://support.microsoft.com/en-us/office/security-and-privacy-in-outlook-web-app-727a553e-5502-4899-b1ea-c84a9ddde2af"
+    "\n 3. https://support.microsoft.com/en-us/office/delay-or-schedule-sending-email-messages-in-outlook-026af69f-c287-490a-a72f-6c65793744ba"
+    "\n 4. https://www.paubox.com/blog/scheduling-emails-and-hipaa-compliance")
+cake_sources = ("1. https://www.indianhealthyrecipes.com/eggless-carrot-cake/"
+                "\n 2. https://www.pccmarkets.com/taste/2013-03/egg_substitutes/"
+                "\n 3. https://www.healthdirect.gov.au/nut-allergies")
+art_sources = ("1. https://en.wikipedia.org/wiki/Post-Impressionism"
+               "\n 2. https://www.metmuseum.org/toah/hd/poim/hd_poim.htm"
+               "\n 3. https://www.britannica.com/art/Post-Impressionism"
+               "\n 4. https://www.theartstory.org/movement/post-impressionism/")
 def google_search_chat(message, history):
     condensed_question = condense_question(message, history)
             index = VectorStoreIndex.from_documents(documents)
             print('Search results vectorized...')
             response = generate_chat_response_with_history_rag_return_response(index, message, history)
+        else:
+            print(f'Assistant Response: Sorry, no search results found, trying offline backup...')
+            index = read_write_index(path='storage_search/')
+            response = generate_chat_response_with_history_rag_return_response(index, message, history)
+            if "mushroom" in message.lower() or "poison" in message.lower() or "italy" in message.lower():
+                sources = mush_sources
+            elif "email" in message.lower() or "data" in message.lower() or "gdpr" in message.lower():
+                sources = email_sources
+            elif "cake" in message.lower() or "egg" in message.lower() or "nut" in message.lower():
+                sources = cake_sources
+            elif "art" in message.lower() or "post-impressionism" in message.lower() or "postimpressionism" in message.lower():
+                sources = art_sources
+            else:
+                sources = "No sources available for this response."
+        response_text = []
+        string_output = ""
+        for text in response.response_gen:
+            response_text.append(text)
+            string_output = ''.join(response_text)
+            yield string_output
+        yield string_output + f'\n\n --- \n **Sources used:** \n {sources}'
+        print(f'Assistant Response: {string_output}')
     else:
         yield from generate_chat_response_with_history(message, history)

read_write_index.py CHANGED Viewed

@@ -4,8 +4,7 @@ import os
 from llama_index.core import SimpleDirectoryReader, VectorStoreIndex, StorageContext, load_index_from_storage
 logger = logging.getLogger(__name__)
-DOCUMENT_PATH = '../data'
 # remember to delete stored vectors when new documents are added to the data so the storage is recreated

 from llama_index.core import SimpleDirectoryReader, VectorStoreIndex, StorageContext, load_index_from_storage
 logger = logging.getLogger(__name__)
+DOCUMENT_PATH = 'search_data'
 # remember to delete stored vectors when new documents are added to the data so the storage is recreated