Qwen2-VL-7B

Running on Zero

App Files Community

KingNish committed on Sep 18, 2024

Commit

88bde73

verified ·

1 Parent(s): ab06fa9

Update app.py

Browse files

Files changed (1) hide show

app.py +4 -25

app.py CHANGED Viewed

@@ -8,8 +8,6 @@ import subprocess
 from datetime import datetime
 import numpy as np
 import os
-from moviepy.editor import VideoFileClip
-import loadimg
 # Install flash-attn
 subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
@@ -21,35 +19,16 @@ processor = AutoProcessor.from_pretrained(MODEL_ID, trust_remote_code=True)
 DESCRIPTION = "[Qwen2-VL-7B Demo](https://huggingface.co/Qwen/Qwen2-VL-7B-Instruct)"
-# Helper function to save media and return path
-def save_media_and_get_path(media, media_type):
-    if media is None:
-        gr.Warning(f"No {media_type} provided. Please upload a {media_type} before submitting.")
-        raise ValueError(f"No {media_type} provided.")
-    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
-    filename = f"{media_type}_{timestamp}.{'png' if media_type == 'image' else 'webm'}"
-    if media_type == "image":
-        media = loadimg(media, "pil")
-        media.save(filename)
-    elif media_type == "video":
-        VideoFileClip(media).write_videofile(filename, fps=8, audio=False)
-    return os.path.abspath(filename)
 @spaces.GPU
-def qwen_inference(media, text_input=None):
-    print(media)
     image_extensions = Image.registered_extensions()
-    if media.endswith(tuple([i for i, f in image_extensions.items()])):
         media_type = "image"
-    elif media.endswith(("avi", "mp4", "mov", "mkv", "flv", "wmv", "mjpeg", "wav", "gif", "webm", "m4v", "3gp")):  # Check if it's a video path
         media_type = "video"
     else:
         raise ValueError("Unsupported media type. Please upload an image or video.")
-    media_path = media
     messages = [
         {

 from datetime import datetime
 import numpy as np
 import os
 # Install flash-attn
 subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
 DESCRIPTION = "[Qwen2-VL-7B Demo](https://huggingface.co/Qwen/Qwen2-VL-7B-Instruct)"
 @spaces.GPU
+def qwen_inference(media_path, text_input=None):
     image_extensions = Image.registered_extensions()
+    if media_path.endswith(tuple([i for i, f in image_extensions.items()])):
         media_type = "image"
+    elif media_path.endswith(("avi", "mp4", "mov", "mkv", "flv", "wmv", "mjpeg", "wav", "gif", "webm", "m4v", "3gp")):  # Check if it's a video path
         media_type = "video"
     else:
         raise ValueError("Unsupported media type. Please upload an image or video.")
     messages = [
         {