krishnapal2308 committed on
Commit
92872fa
·
1 Parent(s): bf82131

Use PyTorch instead of TensorFlow

Browse files
__pycache__/vit_gpt2.cpython-310.pyc CHANGED
Binary files a/__pycache__/vit_gpt2.cpython-310.pyc and b/__pycache__/vit_gpt2.cpython-310.pyc differ
 
vit_gpt2.py CHANGED
@@ -1,8 +1,7 @@
1
- import tensorflow as tf
2
- from transformers import TFVisionEncoderDecoderModel, ViTImageProcessor, AutoTokenizer
3
  from PIL import Image
4
 
5
- model = TFVisionEncoderDecoderModel.from_pretrained("vit-gpt2-image-captioning", from_pt=True)
6
  feature_extractor = ViTImageProcessor.from_pretrained("vit-gpt2-image-captioning")
7
  tokenizer = AutoTokenizer.from_pretrained("vit-gpt2-image-captioning")
8
 
@@ -17,7 +16,7 @@ def predict_step(img_array):
17
  if i_image.mode != "RGB":
18
  i_image = i_image.convert(mode="RGB")
19
 
20
- pixel_values = feature_extractor(images=i_image, return_tensors="tf", do_normalize=True).pixel_values
21
 
22
  output_ids = model.generate(pixel_values, **gen_kwargs)
23
 
 
1
+ from transformers import VisionEncoderDecoderModel, ViTImageProcessor, AutoTokenizer
 
2
  from PIL import Image
3
 
4
+ model = VisionEncoderDecoderModel.from_pretrained("vit-gpt2-image-captioning")
5
  feature_extractor = ViTImageProcessor.from_pretrained("vit-gpt2-image-captioning")
6
  tokenizer = AutoTokenizer.from_pretrained("vit-gpt2-image-captioning")
7
 
 
16
  if i_image.mode != "RGB":
17
  i_image = i_image.convert(mode="RGB")
18
 
19
+ pixel_values = feature_extractor(images=i_image, return_tensors="pt", do_normalize=True).pixel_values
20
 
21
  output_ids = model.generate(pixel_values, **gen_kwargs)
22