Spaces:
Running
on
Zero
Running
on
Zero
dongyh20
commited on
Commit
·
8a47087
1
Parent(s):
4ef079c
update space
Browse files
app.py
CHANGED
@@ -154,6 +154,8 @@ def extract_audio(videos_file_path):
|
|
154 |
@spaces.GPU(duration=120)
|
155 |
def ola_inference(multimodal, audio_path):
|
156 |
visual, text = multimodal["files"][0], multimodal["text"]
|
|
|
|
|
157 |
if visual.endswith("image2.png"):
|
158 |
modality = "video"
|
159 |
visual = f"{cur_dir}/case/case1.mp4"
|
@@ -216,6 +218,8 @@ def ola_inference(multimodal, audio_path):
|
|
216 |
else:
|
217 |
qs = ''
|
218 |
if USE_SPEECH and audio_path:
|
|
|
|
|
219 |
qs = DEFAULT_IMAGE_TOKEN + "\n" + "User's question in speech: " + DEFAULT_SPEECH_TOKEN + '\n'
|
220 |
elif USE_SPEECH:
|
221 |
qs = DEFAULT_SPEECH_TOKEN + DEFAULT_IMAGE_TOKEN + "\n" + qs
|
|
|
154 |
@spaces.GPU(duration=120)
|
155 |
def ola_inference(multimodal, audio_path):
|
156 |
visual, text = multimodal["files"][0], multimodal["text"]
|
157 |
+
if not visual:
|
158 |
+
return "ERROR: Image or Video is required.", None
|
159 |
if visual.endswith("image2.png"):
|
160 |
modality = "video"
|
161 |
visual = f"{cur_dir}/case/case1.mp4"
|
|
|
218 |
else:
|
219 |
qs = ''
|
220 |
if USE_SPEECH and audio_path:
|
221 |
+
if text:
|
222 |
+
return "ERROR: Please provide either text or audio question for image, not both.", None
|
223 |
qs = DEFAULT_IMAGE_TOKEN + "\n" + "User's question in speech: " + DEFAULT_SPEECH_TOKEN + '\n'
|
224 |
elif USE_SPEECH:
|
225 |
qs = DEFAULT_SPEECH_TOKEN + DEFAULT_IMAGE_TOKEN + "\n" + qs
|