Spaces:
Sleeping
Sleeping
File size: 879 Bytes
d3cd5c1 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 |
from PIL import Image
from transformers import AutoTokenizer
from moondream.hf import LATEST_REVISION, Moondream, detect_device
# Ask moondream's helper which device and dtype to run with.
device, dtype = detect_device()

# Model identifier shared by the tokenizer and the model; both are loaded at
# the same revision (LATEST_REVISION).
model_id = "vikhyatk/moondream2"
tokenizer = AutoTokenizer.from_pretrained(model_id, revision=LATEST_REVISION)

# Load the weights with the detected dtype, then move the model to the
# detected device.
moondream = Moondream.from_pretrained(
    model_id, revision=LATEST_REVISION, torch_dtype=dtype
)
moondream = moondream.to(device=device)

# Switch to eval mode before answering (presumably torch.nn.Module.eval --
# confirm Moondream is a torch module).
moondream.eval()
# Questions to ask. There is one prompt per entry of the `images` list passed
# to batch_answer below (presumably paired by index: the first two prompts go
# with demo-1.jpg, the last two with demo-2.jpg).
prompts = [
    "What is the girl doing?",
    "What color is the girl's hair?",
    "What is this?",
    "What is behind the stand?",
]

# Image.open() is lazy and keeps the underlying file open, so the images are
# used as context managers: the file handles are released as soon as inference
# finishes, even if batch_answer raises. image1/image2 should not be used
# after this block.
with Image.open("assets/demo-1.jpg") as image1:
    with Image.open("assets/demo-2.jpg") as image2:
        answers = moondream.batch_answer(
            images=[image1, image1, image2, image2],
            prompts=prompts,
            tokenizer=tokenizer,
        )
# Print every prompt together with the answer at the same position, followed
# by an empty line to separate the pairs.
for question, answer in zip(prompts, answers):
    print(f"Q: {question}")
    print(f"A: {answer}")
    print()
|