vincentmin committed
Commit 93f881f · Parent(s): d3db9a3
Update app.py
app.py CHANGED
@@ -5,15 +5,12 @@ from langchain.text_splitter import RecursiveCharacterTextSplitter
 from langchain.vectorstores import Chroma
 from langchain.embeddings import HuggingFaceEmbeddings
 from langchain.llms import HuggingFaceHub
-# from langchain.llms import FakeListLLM
 from langchain.chains import LLMChain, StuffDocumentsChain
 from langchain.prompts import PromptTemplate
 from langchain.schema import Document
 
 
 LOAD_MAX_DOCS = 100
-# CHUNK_SIZE = 1000
-# text_splitter = RecursiveCharacterTextSplitter(chunk_size=CHUNK_SIZE)
 
 embeddings = HuggingFaceEmbeddings()
 
@@ -25,7 +22,6 @@ prompt = PromptTemplate(
     template="""Write a personalised newsletter for a researcher on the most recent exciting developments in his field. The researcher describes his work as follows:"{context}". Base the newsletter on the articles below. Extract the most exciting points and combine them into an excillerating newsletter. Use Markdown format\n#ARTICLES\n\n"{text}"\n\nNEWSLETTER:\n# Your AI curated newsletter\n""",
     input_variables=["context", "text"])
 
-# llm = FakeListLLM(responses=list(map(str, range(100))))
 REPO_ID = "HuggingFaceH4/starchat-beta"
 llm = HuggingFaceHub(
     repo_id=REPO_ID,
@@ -53,7 +49,7 @@ def process_document(doc: Document):
 def get_data(lookback_days: float, user_query: str):
     print("User query:", user_query)
     max_date = date.today()
-    min_date = (max_date - timedelta(days=
+    min_date = (max_date - timedelta(days=lookback_days))
     query = f"cat:hep-th AND submittedDate:[{min_date.strftime('%Y%m%d')} TO {max_date.strftime('%Y%m%d')}]"
     loader = ArxivLoader(query=query, load_max_docs=LOAD_MAX_DOCS)
     docs = loader.load()
@@ -70,14 +66,6 @@ def get_data(lookback_days: float, user_query: str):
     print("LLM output:", output_text)
     return f"# Your AI curated newsletter\n{output['output_text']}\n\n\n\n## Used articles:\n\n{articles}"
 
-# demo = gr.Interface(
-#     fn=get_data,
-#     inputs=[lookback_days, input_text]
-#     outputs=gr.Markdown(),
-#     title="Arxiv AI Curated Newsletter",
-#     description="Describe your field of research in a few words to get a newsletter-style summary of today's Arxiv articles.",
-# )
-
 with gr.Blocks() as demo:
     gr.Markdown(
         """
@@ -87,14 +75,17 @@ with gr.Blocks() as demo:
     Get a newsletter-style summary of today's Arxiv articles personalised to your field of research.
     """
     )
-
+
+    with gr.Accordion("Parameters", open=False):
+        lookback_days = gr.Number(2, label="Articles from this many days in the past will be searched through.", minimum=1, maximum=7)
+
     input_text = gr.Textbox(placeholder="Describe your field of research in a few words")
     gr.Examples(
         [["Supersymmetric Conformal Field Theory"], ["Black hole information paradox"]],
         input_text,
     )
     output = gr.Markdown()
-
-
+    btn = gr.Button(value="Submit")
+    btn.click(fn=get_data, inputs=[lookback_days,input_text], outputs=output)
 
 demo.queue().launch()
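The added controls route the lookback window from the UI into the arXiv query: the `gr.Number` inside the accordion supplies `lookback_days`, `btn.click` passes it together with the research description into `get_data`, and `get_data` uses it to bound `submittedDate`. Below is a minimal runnable sketch of that wiring, with a stub `get_data` that only builds and echoes the query string (the real `get_data` loads the articles and runs them through the LLM chain); it assumes a gradio version whose `gr.Number` supports `minimum`/`maximum`, as this commit itself relies on.

# Sketch only, not the app's full code: the same Blocks layout as the commit,
# with get_data stubbed so the date-window logic can be exercised without
# LangChain or a HuggingFaceHub token.
from datetime import date, timedelta

import gradio as gr


def get_data(lookback_days: float, user_query: str) -> str:
    # Same window the commit wires up: today minus lookback_days days.
    max_date = date.today()
    min_date = max_date - timedelta(days=lookback_days)
    query = (
        "cat:hep-th AND submittedDate:"
        f"[{min_date.strftime('%Y%m%d')} TO {max_date.strftime('%Y%m%d')}]"
    )
    # The real app feeds the loaded articles and user_query through the LLM
    # chain; here we just echo the query that would be sent to arXiv.
    return f"Query for '{user_query}':\n\n`{query}`"


with gr.Blocks() as demo:
    with gr.Accordion("Parameters", open=False):
        lookback_days = gr.Number(2, label="Lookback window in days", minimum=1, maximum=7)
    input_text = gr.Textbox(placeholder="Describe your field of research in a few words")
    output = gr.Markdown()
    btn = gr.Button(value="Submit")
    # The Number and Textbox values are passed positionally to get_data.
    btn.click(fn=get_data, inputs=[lookback_days, input_text], outputs=output)

demo.queue().launch()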