Update app.py
app.py
CHANGED
@@ -29,50 +29,44 @@ def frame_capture(video_path, num_frames=5):
     vidObj.release()
     return frames

-# Function to generate text descriptions for frames
-def
+# Function to generate text descriptions for frames or answer a specific question
+def analyze_video(video_path, user_question):
     frames = frame_capture(video_path)
     images = [PIL.Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)) for frame in frames]

-
-
+    if user_question.strip():
+        prompt = f"Based on these video frames, {user_question}"
+    else:
+        prompt = "Describe what is happening in each of these frames in this video."

-    responses = model.generate_content(images_with_prompt)
-    descriptions = [response.text for response in responses]
-
-    formatted_description = format_descriptions(descriptions)
-    return formatted_description
-
-# Function to handle chat interaction
-def chat_interaction(video_path, chatbot, user_message):
-    frames = frame_capture(video_path)
-    images = [PIL.Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)) for frame in frames]
-
-    prompt = f"Based on these video frames, {user_message}"
     images_with_prompt = [prompt] + images

     responses = model.generate_content(images_with_prompt)
-
+    descriptions = [response.text for response in responses]

-
-    return "", chatbot
+    return descriptions[-1] if user_question.strip() else format_descriptions(descriptions)

 # Helper function to format descriptions
 def format_descriptions(descriptions):
     return ' '.join(descriptions).strip()

+# Function to handle chat interaction
+def chat_interaction(video_path, chatbot, user_message):
+    response = analyze_video(video_path, user_message)
+    chatbot.append((user_message, response))
+    return "", chatbot

-#
-
-
-
-video_input_2 = gr.Video(label="Upload Video", autoplay=True)
-chatbot = gr.Chatbot(label="Video Analysis Chatbot")
-user_input = gr.Textbox(label="Ask something specific about the video", placeholder="E.g., Are there any cars in this video?")
-user_input.submit(fn=chat_interaction, inputs=[video_input_2, chatbot, user_input], outputs=[user_input, chatbot])
+# Define Gradio interface
+video_input = gr.Video(label="Upload Video", autoplay=True)
+chatbot = gr.Chatbot(label="Video Analysis Chatbot")
+user_input = gr.Textbox(label="Ask something specific about the video", placeholder="E.g., Are there any cars in this video?")

-#
+# Create Gradio app
 with gr.Blocks() as demo:
-    gr.
+    with gr.Column():
+        video_input.render()
+        chatbot.render()
+        user_input.render()
+        user_input.submit(fn=chat_interaction, inputs=[video_input, chatbot, user_input], outputs=[user_input, chatbot])

 demo.launch()
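For context: the hunk starts inside frame_capture, so the top of app.py is not part of this diff. Below is a minimal sketch of what that preceding code presumably looks like. The frame_capture signature and the vidObj / frames names come from the diff itself; the import block, the GOOGLE_API_KEY environment variable, and the "gemini-pro-vision" model id are assumptions for illustration, not part of this commit.

import os

import cv2
import PIL.Image
import google.generativeai as genai
import gradio as gr

# Assumed setup: configure the Gemini client and pick a vision-capable model.
genai.configure(api_key=os.environ["GOOGLE_API_KEY"])  # assumed env var name
model = genai.GenerativeModel("gemini-pro-vision")  # assumed model id

# Signature taken from the hunk header; body is a plausible reconstruction
# that samples num_frames frames evenly across the video with OpenCV.
def frame_capture(video_path, num_frames=5):
    vidObj = cv2.VideoCapture(video_path)
    total = int(vidObj.get(cv2.CAP_PROP_FRAME_COUNT))
    step = max(total // num_frames, 1)
    frames = []
    for i in range(num_frames):
        # Seek to the i-th sample position, then grab one frame.
        vidObj.set(cv2.CAP_PROP_POS_FRAMES, i * step)
        success, image = vidObj.read()
        if not success:
            break
        frames.append(image)
    vidObj.release()
    return frames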