rag_ColPali_Qwen2VL

Running on Zero

AdrienB134 committed on Sep 6

Commit

8575432

•

1 Parent(s): 4e37306

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -49,7 +49,7 @@ def model_inference(
         "Qwen/Qwen2-VL-2B-Instruct",
         attn_implementation="flash_attention_2", #doesn't work on zerogpu WTF?!
         trust_remote_code=True,
-        torch_dtype="auto").cuda().eval()
     # default processer
     min_pixels = 256*28*28

         "Qwen/Qwen2-VL-2B-Instruct",
         attn_implementation="flash_attention_2", #doesn't work on zerogpu WTF?!
         trust_remote_code=True,
+        torch_dtype=torch.bfloat16).to("cuda:0")
     # default processer
     min_pixels = 256*28*28