Spaces:

Bhashini-IITJ
/

IndicPhotoOCR

Running

anikde committed 8 days ago

Commit

ec00790

1 Parent(s): ef23964

added device config for ViT

Files changed (2) hide show

IndicPhotoOCR/ocr.py CHANGED Viewed

@@ -109,7 +109,7 @@ class OCR:
         # Predict script language, here we assume "hindi" as the model name
         if self.verbose:
             print("Identifying script for the cropped area...")
-        script_lang = self.identifier.identify(cropped_path, "hindi")  # Use "hindi" as the model name
         # print(script_lang)
         # Clean up temporary file

         # Predict script language, here we assume "hindi" as the model name
         if self.verbose:
             print("Identifying script for the cropped area...")
+        script_lang = self.identifier.identify(cropped_path, "hindi", self.device)  # Use "hindi" as the model name
         # print(script_lang)
         # Clean up temporary file

IndicPhotoOCR/script_identification/vit/vit_infer.py CHANGED Viewed

@@ -135,11 +135,11 @@ class VIT_identifier:
-    def identify(self, image_path,model_name):
         model_path = self.ensure_model(model_name)
         vit = ViTForImageClassification.from_pretrained(model_path)
-        model= pipeline('image-classification', model=vit, feature_extractor=processor,device=0)
         if image_path.endswith((".png", ".jpg", ".jpeg")):

+    def identify(self, image_path,model_name, device):
         model_path = self.ensure_model(model_name)
         vit = ViTForImageClassification.from_pretrained(model_path)
+        model= pipeline('image-classification', model=vit, feature_extractor=processor,device=device)
         if image_path.endswith((".png", ".jpg", ".jpeg")):