Spaces:
Sleeping
Sleeping
krishnapal2308
committed on
Commit
·
92872fa
1
Parent(s):
bf82131
pytorch instead of tensorflow
Browse files
- __pycache__/vit_gpt2.cpython-310.pyc +0 -0
- vit_gpt2.py +3 -4
__pycache__/vit_gpt2.cpython-310.pyc
CHANGED
Binary files a/__pycache__/vit_gpt2.cpython-310.pyc and b/__pycache__/vit_gpt2.cpython-310.pyc differ
|
|
vit_gpt2.py
CHANGED
@@ -1,8 +1,7 @@
|
|
1 |
-
import
|
2 |
-
from transformers import TFVisionEncoderDecoderModel, ViTImageProcessor, AutoTokenizer
|
3 |
from PIL import Image
|
4 |
|
5 |
-
model = TFVisionEncoderDecoderModel.from_pretrained("vit-gpt2-image-captioning")
|
6 |
feature_extractor = ViTImageProcessor.from_pretrained("vit-gpt2-image-captioning")
|
7 |
tokenizer = AutoTokenizer.from_pretrained("vit-gpt2-image-captioning")
|
8 |
|
@@ -17,7 +16,7 @@ def predict_step(img_array):
|
|
17 |
if i_image.mode != "RGB":
|
18 |
i_image = i_image.convert(mode="RGB")
|
19 |
|
20 |
-
pixel_values = feature_extractor(images=i_image, return_tensors="tf", do_normalize=True).pixel_values
|
21 |
|
22 |
output_ids = model.generate(pixel_values, **gen_kwargs)
|
23 |
|
|
|
1 |
+
from transformers import VisionEncoderDecoderModel, ViTImageProcessor, AutoTokenizer
|
|
|
2 |
from PIL import Image
|
3 |
|
4 |
+
model = VisionEncoderDecoderModel.from_pretrained("vit-gpt2-image-captioning")
|
5 |
feature_extractor = ViTImageProcessor.from_pretrained("vit-gpt2-image-captioning")
|
6 |
tokenizer = AutoTokenizer.from_pretrained("vit-gpt2-image-captioning")
|
7 |
|
|
|
16 |
if i_image.mode != "RGB":
|
17 |
i_image = i_image.convert(mode="RGB")
|
18 |
|
19 |
+
pixel_values = feature_extractor(images=i_image, return_tensors="pt", do_normalize=True).pixel_values
|
20 |
|
21 |
output_ids = model.generate(pixel_values, **gen_kwargs)
|
22 |
|