Spaces:

yasserrmd
/

DailySnap

Running on Zero

yasserrmd committed 4 days ago

Commit

a516023

•

1 Parent(s): 3d3237e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -20,7 +20,7 @@ model = YOLOv10.from_pretrained('jameslahm/yolov10x').to(device)
 model_id = "meta-llama/Llama-3.2-11B-Vision-Instruct"
-model_code = MllamaForConditionalGeneration.from_pretrained(
     model_id,
     torch_dtype=torch.bfloat16,
     device_map="auto",
@@ -29,7 +29,7 @@ processor = AutoProcessor.from_pretrained(model_id)
 model_name = "Qwen/Qwen2.5-Coder-7B-Instruct"
-model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype="auto", device_map="auto")
 tokenizer = AutoTokenizer.from_pretrained(model_name)
@@ -81,7 +81,7 @@ def generate_image_desc(image):
     inputs = processor(image, input_text, return_tensors="pt").to(model.device)
     # Generate the output from the model
-    output = model.generate(**inputs, max_new_tokens=300)
     print(output)
     markdown_text = processor.decode(output[0])
     print(markdown_text)

 model_id = "meta-llama/Llama-3.2-11B-Vision-Instruct"
+model_vision = MllamaForConditionalGeneration.from_pretrained(
     model_id,
     torch_dtype=torch.bfloat16,
     device_map="auto",
 model_name = "Qwen/Qwen2.5-Coder-7B-Instruct"
+model_code = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype="auto", device_map="auto")
 tokenizer = AutoTokenizer.from_pretrained(model_name)
     inputs = processor(image, input_text, return_tensors="pt").to(model.device)
     # Generate the output from the model
+    output = model_vision.generate(**inputs, max_new_tokens=300)
     print(output)
     markdown_text = processor.decode(output[0])
     print(markdown_text)