Spaces:

DataPrism
/

GPT-auto-webscraping

Runtime error

App Files Community

GianJSX committed on Aug 15, 2023

Commit

3d86e8b

1 Parent(s): 31ff83b

start def

Browse files

Files changed (1) hide show

app.py +32 -30

app.py CHANGED Viewed

@@ -15,26 +15,32 @@ os.environ["LANGCHAIN_ENDPOINT"]="https://api.smith.langchain.com"
 os.environ["LANGCHAIN_API_KEY"]=st.secrets["LANGCHAIN_API_KEY"]
 os.environ["LANGCHAIN_PROJECT"]=st.secrets["LANGCHAIN_PROJECT"]
 @traceable(run_type="tool")
-def start(run):
-    st.write("This app helps you to extract data from HTML code using web scraping. It uses GPT-3.5-turbo to generate the code for you. \n *Contribute to this project on [GitHub](https://github.com/CognitiveLabs/GPT-auto-webscraping)*")
-    with st.expander(label="Check out the video demo"):
-        yt_video = st.video("https://www.youtube.com/watch?v=_zeCun4OlCc")
-    info_text = """
-    **Quick start** \n
-    Fill the input with <HTML code>.
-    * Choose a repeating element on the page, like a product on a list.
-    * Inspect the HTML code and copy the element.
-    After generating the "output format" and the code, paste the complete HTML code of the page in the last input to test it
-    """
-    st.write(info_text)
-    st.image("https://j.gifs.com/gpqvPl.gif")
-    return run
-# use time library
-start(run='start')
 if assistant_api_key == '':
     assistant_api_key = st.secrets["API_KEY"]
@@ -43,20 +49,16 @@ if assistant_api_key == '':
 else:
     gpt_assistant = GPTAssistant(assistant_api_key)
-html_content = None
 # check if html_content is an url, and show error if it is
-def html_content_input():
-    html_content = st.text_input("Paste the HTML tags of the item you want to extract:", max_chars=10000, help="example: <li>Product 1 </li>, watch the video above")
-    if html_content:
-        if html_content.startswith("http"):
-            st.write("Please paste the HTML piece code, not the URL")
-            html_content = None
-    return st.button("Generate output format & code")
-extract_button = html_content_input()
 if html_content and extract_button:
     try:

 os.environ["LANGCHAIN_API_KEY"]=st.secrets["LANGCHAIN_API_KEY"]
 os.environ["LANGCHAIN_PROJECT"]=st.secrets["LANGCHAIN_PROJECT"]
+st.session_state['session_started'] = False
 @traceable(run_type="tool")
+def start_session(session_started):
+    return session_started
+# change session_started to True
+if not st.session_state['session_started']:
+    st.session_state['session_started'] = start_session(True)
+st.write("This app helps you to extract data from HTML code using web scraping. It uses GPT-3.5-turbo to generate the code for you. \n *Contribute to this project on [GitHub](https://github.com/CognitiveLabs/GPT-auto-webscraping)*")
+with st.expander(label="Check out the video demo"):
+    yt_video = st.video("https://www.youtube.com/watch?v=_zeCun4OlCc")
+info_text = """
+**Quick start** \n
+Fill the input with <HTML code>.
+-Choose a repeating element on the page, like a product on a list.
+-Inspect the HTML code and copy the element.
+-After generating the "output format" and the code, paste the complete HTML code of the page in the last input to test it
+"""
+st.write(info_text)
+st.image("https://j.gifs.com/gpqvPl.gif")
 if assistant_api_key == '':
     assistant_api_key = st.secrets["API_KEY"]
 else:
     gpt_assistant = GPTAssistant(assistant_api_key)
+# get the html content
+html_content = st.text_input("Paste the HTML tags of the item you want to extract:", max_chars=10000, help="example: <li>Product 1 </li>, watch the video above")
 # check if html_content is an url, and show error if it is
+if html_content:
+    if html_content.startswith("http"):
+        st.write("Please paste the HTML piece code, not the URL")
+        html_content = None
+extract_button = st.button("Generate output format & code")
 if html_content and extract_button:
     try: