AdrienB134 committed on
Commit
8575432
1 Parent(s): 4e37306

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -49,7 +49,7 @@ def model_inference(
49
  "Qwen/Qwen2-VL-2B-Instruct",
50
  attn_implementation="flash_attention_2", #doesn't work on zerogpu WTF?!
51
  trust_remote_code=True,
52
- torch_dtype="auto").cuda().eval()
53
 
54
  # default processer
55
  min_pixels = 256*28*28
 
49
  "Qwen/Qwen2-VL-2B-Instruct",
50
  attn_implementation="flash_attention_2", #doesn't work on zerogpu WTF?!
51
  trust_remote_code=True,
52
+ torch_dtype=torch.bfloat16).to("cuda:0")
53
 
54
  # default processer
55
  min_pixels = 256*28*28