Niki Zhang committed
Commit 7dc7f05 · verified · Parent: 9a7446e

Update app.py

Files changed (1):
  app.py  +68 -59
app.py CHANGED
@@ -1009,7 +1009,7 @@ async def upload_callback(image_input,state, log_state, task_type, visual_chatgp
 image_input.save(new_image_path)
 print("img_path",new_image_path)
 visual_chatgpt.current_image = new_image_path
-paragraph = get_gpt_response(openai_api_key, new_image_path,f"What's going on in this picture? in {language}")
+
 # visual_chatgpt.agent.memory.buffer = visual_chatgpt.agent.memory.buffer + visual_chatgpt.global_prompt
 if task_type=="task 3":
 name="Along the River During the Qingming Festival"
@@ -1017,6 +1017,7 @@ async def upload_callback(image_input,state, log_state, task_type, visual_chatgp
 year="12th century (Song Dynasty)"
 material="Chinese painting"
 gender="male"
+paragraph="This image depicts a traditional Chinese medicine clinic scene from an ancient painting. The interior of the clinic shows various activities related to traditional Chinese medical practices. Inside the clinic: 1. To the right, a practitioner is consulting with a patient, examining the pulse, which is a common diagnostic method in traditional Chinese medicine. 2. To the far right, another practitioner is seated at a desk, likely preparing or recording prescriptions. Behind him is a traditional Chinese medicine cabinet with numerous drawers for storing herbs and medicinal ingredients.3. On the left side of the clinic, there are patients seated, possibly waiting for their turn for consultation or treatment.4. Wall hangings, presumably diagrams or medical posters, are displayed within the clinic.Outside and around the clinic: 1. People walking by or moving around, possibly other patients or townspeople, indicating the scene takes place in a lively community setting.2. Someone carrying goods in a traditional yoke balanced across their shoulders, indicative of daily life and commerce. This scene provides a detailed glimpse into the practice of traditional Chinese medicine and everyday life in historical China."
 
 elif task_type=="task 1":
 name ="The Ambassadors"
@@ -1024,6 +1025,7 @@ async def upload_callback(image_input,state, log_state, task_type, visual_chatgp
 year = "1533 (Northern Renaissance)"
 material="Realism"
 gender = "male"
+paragraph="This image is a famous painting known as \"The Ambassadors\" by Hans Holbein the Younger, created in 1533. In the painting, there are two men standing on either side of a table covered with a rich carpet. The man on the left is dressed in elaborate, luxurious clothing, indicating his high social status, and holds a dagger. The man on the right is dressed in more somber, clerical attire, possibly denoting a scholarly or ecclesiastical position.The table between them is filled with various objects, including scientific instruments like a globe, a sundial, a quadrant, and books, reflecting the intellectual interests and pursuits of the time, specifically in navigation and astronomy. A significant detail in the painting is the distorted object at the bottom center, which, when viewed from an angle, reveals itself to be a skull — a classic example of anamorphosis. This hidden skull serves as a memento mori, reminding viewers of the inevitability of death, a common theme in Renaissance art."
 
 elif task_type=="task 2":
 name = "The Football Players"
@@ -1031,18 +1033,15 @@ async def upload_callback(image_input,state, log_state, task_type, visual_chatgp
 year= "1912 (Cubism)"
 material="Cubism"
 gender= "male"
+paragraph="This image is a painting titled \"The Football Players\" created by the artist Albert Gleizes in 1912. It is an example of Cubist art, a style characterized by fragmented and abstract representations. The painting depicts a group of football players, mid-action, seemingly in the midst of a game. The figures are rendered in geometric shapes and planes, creating a sense of movement and dynamism. The use of intersecting lines and overlapping forms adds to the dynamic and somewhat chaotic feel of the composition. The use of color and form communicates the energy and intensity of the sport."
 else:
+paragraph = get_gpt_response(openai_api_key, new_image_path,f"What's going on in this picture? in {language}")
 parsed_data = get_gpt_response(openai_api_key, new_image_path,"Please provide the name, artist, year of creation (including the art historical period), and painting style used for this painting. Return the information in dictionary format without any newline characters. Format as follows: { \"name\": \"Name of the painting\", \"artist\": \"Name of the artist\", \"year\": \"Year of creation (Art historical period)\", \"style\": \"Painting style used in the painting\",\"gender\": \"The gender of the author\"}")
 print(parsed_data)
 parsed_data = json.loads(parsed_data.replace("'", "\""))
 name, artist, year, material,gender= parsed_data["name"],parsed_data["artist"],parsed_data["year"], parsed_data["style"],parsed_data['gender']
 gender=gender.lower()
-print("gender",gender)
-print("material",material)
-
-
-
-
+
 if language=="English":
 if naritive_mapping[narritive]==0 :
 msg=f"🤖 Hi, I am EyeSee. Let's explore this painting '{name}' together. You can click on the area you're interested in and choose from four types of information: Description, Analysis, Interpretation, and Judgment. Based on your selection, I will provide you with the relevant information."
@@ -1708,56 +1707,60 @@ async def texttospeech(text, language,gender='female'):
 return None
 
 # give the reason of recommendation
-async def item_associate(new_crop,openai_api_key,language,autoplay,length,log_state,sort_score,narritive,state, evt: gr.SelectData):
-persona=naritive_mapping[narritive]
-rec_path=evt._data['value']['image']['path']
-index="Item Recommendation Picture "+ str(evt.index)
-print("rec_path",rec_path)
-
-prompt=recommendation_prompt[0][persona].format(language=language,length=length)
-
-image_paths=[new_crop,rec_path]
-
-result=get_gpt_response(openai_api_key, image_paths, prompt)
-print("recommend result",result)
-state += [(None, f"{result}")]
-log_state += [("User wants to know object recomendation reason", None)]
-log_state = log_state + [(narritive, None)]
-log_state = log_state + [(f"image sort ranking {sort_score}", None)]
-log_state = log_state + [(None, f"{result}")]
-read_info = re.sub(r'[#[\]!*]','',result)
-read_info = emoji.replace_emoji(read_info,replace="")
-print("associate",read_info)
-audio_output=None
-if autoplay:
-audio_output = await texttospeech(read_info, language)
-return state,state,audio_output,log_state,index,gr.update(value=[])
-
-
-async def style_associate(image_path,openai_api_key,language,autoplay,length,log_state,sort_score,narritive,state,artist,evt: gr.SelectData):
-persona=naritive_mapping[narritive]
-rec_path=evt._data['value']['image']['path']
-index="Style Recommendation Picture "+str(evt.index)
-print("rec_path",rec_path)
-if persona==1:
-prompt=recommendation_prompt[1][persona].format(language=language,length=length,artist=artist[8:])
-else:
-prompt=recommendation_prompt[1][persona].format(language=language,length=length)
-image_paths=[image_path,rec_path]
-result=get_gpt_response(openai_api_key, image_paths, prompt )
-print("recommend result",result)
-state += [(None, f"{result}")]
-log_state += [("User wants to know style recomendation reason", None)]
-log_state = log_state + [(narritive, None)]
-log_state = log_state + [(f"image sort ranking {sort_score}", None)]
-log_state = log_state + [(None, f"{result}")]
-read_info = re.sub(r'[#[\]!*]','',result)
-read_info = emoji.replace_emoji(read_info,replace="")
-print("associate",read_info)
-audio_output=None
-if autoplay:
-audio_output = await texttospeech(read_info, language)
-return state,state,audio_output,log_state,index,gr.update(value=[])
+async def item_associate(new_crop,openai_api_key,language,autoplay,length,log_state,sort_score,narritive,state,recommend_type,evt: gr.SelectData):
+if recommend_type=="Reasons":
+persona=naritive_mapping[narritive]
+rec_path=evt._data['value']['image']['path']
+index="Item Recommendation Picture "+ str(evt.index)
+print("rec_path",rec_path)
+
+prompt=recommendation_prompt[0][persona].format(language=language,length=length)
+
+image_paths=[new_crop,rec_path]
+
+result=get_gpt_response(openai_api_key, image_paths, prompt)
+print("recommend result",result)
+state += [(None, f"{result}")]
+log_state += [("User wants to know object recomendation reason", None)]
+log_state = log_state + [(narritive, None)]
+log_state = log_state + [(f"image sort ranking {sort_score}", None)]
+log_state = log_state + [(None, f"{result}")]
+read_info = re.sub(r'[#[\]!*]','',result)
+read_info = emoji.replace_emoji(read_info,replace="")
+print("associate",read_info)
+audio_output=None
+if autoplay:
+audio_output = await texttospeech(read_info, language)
+return state,state,audio_output,log_state,index,gr.update(value=[])
+return state,state,None,log_state,None,gr.update(value=[])
+
+
+async def style_associate(image_path,openai_api_key,language,autoplay,length,log_state,sort_score,narritive,state,artist,recommend_type,evt: gr.SelectData):
+if recommend_type=="Reasons":
+persona=naritive_mapping[narritive]
+rec_path=evt._data['value']['image']['path']
+index="Style Recommendation Picture "+str(evt.index)
+print("rec_path",rec_path)
+if persona==1:
+prompt=recommendation_prompt[1][persona].format(language=language,length=length,artist=artist[8:])
+else:
+prompt=recommendation_prompt[1][persona].format(language=language,length=length)
+image_paths=[image_path,rec_path]
+result=get_gpt_response(openai_api_key, image_paths, prompt )
+print("recommend result",result)
+state += [(None, f"{result}")]
+log_state += [("User wants to know style recomendation reason", None)]
+log_state = log_state + [(narritive, None)]
+log_state = log_state + [(f"image sort ranking {sort_score}", None)]
+log_state = log_state + [(None, f"{result}")]
+read_info = re.sub(r'[#[\]!*]','',result)
+read_info = emoji.replace_emoji(read_info,replace="")
+print("associate",read_info)
+audio_output=None
+if autoplay:
+audio_output = await texttospeech(read_info, language)
+return state,state,audio_output,log_state,index,gr.update(value=[])
+return state,state,None,log_state,None,gr.update(value=[])
 
 
 def change_naritive(session_type,image_input, state, click_state, paragraph, origin_image,narritive,task_instruct,gallery_output,style_gallery_result,reco_reasons,language="English"):
@@ -2131,6 +2134,12 @@ def create_ui():
 # show_download_button=True
 )
 
+recommend_type = gr.Radio(
+choices=["Preview","Reasons"],
+label="Information Type",
+value="Preview",
+interactive=True)
+
 
 with gr.Column(scale=4,visible=False) as reco_reasons:
 recommend_bot = gr.Chatbot(label="Recommend Reasons", elem_classes="chatbot",height=600)
@@ -2321,7 +2330,7 @@ def create_ui():
 
 gallery_result.select(
 item_associate,
-inputs=[new_crop_save_path,openai_api_key,language,auto_play,length,log_state,sort_rec,naritive,recomended_state],
+inputs=[new_crop_save_path,openai_api_key,language,auto_play,length,log_state,sort_rec,naritive,recomended_state,recommend_type],
 outputs=[recommend_bot,recomended_state,output_audio,log_state,pic_index,recommend_score],
 
 
@@ -2329,7 +2338,7 @@ def create_ui():
 
 style_gallery_result.select(
 style_associate,
-inputs=[image_path,openai_api_key,language,auto_play,length,log_state,sort_rec,naritive,recomended_state,artist_label],
+inputs=[image_path,openai_api_key,language,auto_play,length,log_state,sort_rec,naritive,recomended_state,artist_label,recommend_type],
 outputs=[recommend_bot,recomended_state,output_audio,log_state,pic_index,recommend_score],
 
 
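
Note on the change: the new recommend_type radio is threaded into both gallery select handlers, so clicking a recommended image only calls the language model when the user has switched from "Preview" to "Reasons". The following is a minimal, self-contained sketch of that gating pattern; the component names and the stub function are hypothetical, it is not the app's actual wiring, and it omits the personas, logging, and text-to-speech that app.py adds.

# Minimal sketch of the recommend_type gating pattern (assumed standalone demo,
# not the app's actual wiring; get_reason_stub stands in for the GPT call).
import gradio as gr

def get_reason_stub(index: int) -> str:
    # Placeholder for the model call made by app.py's get_gpt_response(...).
    return f"Reason why recommendation #{index} was suggested would go here."

def on_gallery_select(recommend_type: str, evt: gr.SelectData):
    # Only generate an explanation when the user asked for "Reasons";
    # a plain "Preview" click returns nothing and skips the model call.
    if recommend_type == "Reasons":
        return get_reason_stub(evt.index)
    return ""

with gr.Blocks() as demo:
    recommend_type = gr.Radio(choices=["Preview", "Reasons"],
                              value="Preview",
                              label="Information Type",
                              interactive=True)
    gallery = gr.Gallery(label="Recommendations")  # populated elsewhere in the real app
    reason_box = gr.Textbox(label="Recommend Reasons")
    # The Radio is passed as an extra input, mirroring how the commit appends
    # recommend_type to the inputs of item_associate and style_associate.
    gallery.select(on_gallery_select, inputs=[recommend_type], outputs=[reason_box])

if __name__ == "__main__":
    demo.launch()

Passing the radio value in as an input keeps the handlers stateless, which is why the commit only needs to extend the two inputs= lists and add an early-exit branch inside each handler.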