rakib72642 committed
Commit
e92bd0b
1 Parent(s): 599b1f8

demo structure

Files changed (7)
  1. a.jpg +0 -0
  2. a.py +40 -0
  3. api.py +47 -0
  4. img/a.png +0 -0
  5. main.py +26 -0
  6. new.jpg +0 -0
  7. test.ipynb +106 -0
a.jpg ADDED
a.py ADDED
@@ -0,0 +1,40 @@
+ from easyocr import Reader
+ import cv2
+
+ def cleanup_text(text):
+     # strip out non-ASCII text so we can draw the text on the image
+     # using OpenCV
+     return "".join([c if ord(c) < 128 else "" for c in text]).strip()
+
+ def arabic_ocr(image_path, out_image):
+     # break the input languages into a comma-separated list
+     langs = "ar,en".split(",")
+     gpu1 = -1  # negative value keeps inference on the CPU
+     # print("[INFO] OCR'ing with the following languages: {}".format(langs))
+     # load the input image from disk
+     image = cv2.imread(image_path)
+     # OCR the input image using EasyOCR
+     print("[INFO] OCR'ing input image...")
+     reader = Reader(langs, gpu=gpu1 > 0)
+     results = reader.readtext(image)
+     filename = out_image
+     # loop over the results
+     for (bbox, text, prob) in results:
+         # display the OCR'd text and associated probability
+         print("[INFO] {:.4f}: {}".format(prob, text))
+         # unpack the bounding box
+         (tl, tr, br, bl) = bbox
+         tl = (int(tl[0]), int(tl[1]))
+         tr = (int(tr[0]), int(tr[1]))
+         br = (int(br[0]), int(br[1]))
+         bl = (int(bl[0]), int(bl[1]))
+         # clean up the text and draw the box surrounding the text along
+         # with the OCR'd text itself
+         text = cleanup_text(text)
+         cv2.rectangle(image, tl, br, (0, 255, 0), 2)
+         cv2.putText(image, text, (tl[0], tl[1] - 10),
+                     cv2.FONT_HERSHEY_SIMPLEX, 0.8, (0, 255, 0), 2)
+     # write the annotated output image to disk
+     cv2.imwrite(filename, image)
+     return results
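For context, a minimal usage sketch for a.py (not part of this commit); the input path img/a.png and output path out.jpg are illustrative:

# usage sketch: run EasyOCR-based detection on a local image
from a import arabic_ocr

results = arabic_ocr("img/a.png", "out.jpg")  # paths are illustrative
for (bbox, text, prob) in results:
    print(prob, text)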
api.py ADDED
@@ -0,0 +1,47 @@
+ import json
+ import urllib.request
+
+ import torch
+ import uvicorn
+ from fastapi import FastAPI
+ from pydantic import BaseModel
+
+ from main import main_det
+
+ app = FastAPI()
+
+ class Item(BaseModel):
+     url: str
+
+ async def process_item(item: Item):
+     # download the image to a local file, run OCR on it, and parse the JSON result;
+     # errors propagate so the /ocr handler can report them
+     urllib.request.urlretrieve(item.url, "new.jpg")
+     result = await main_det("new.jpg")
+     return json.loads(result)
+
+ @app.get("/status")
+ async def status():
+     return "AI Server is running"
+
+ @app.post("/ocr")
+ async def create_items(items: Item):
+     try:
+         results = await process_item(items)
+         print("#" * 100)
+         return results
+     except Exception as e:
+         return {"AI": f"Error: {str(e)}"}
+     finally:
+         torch.cuda.empty_cache()
+
+ if __name__ == "__main__":
+     uvicorn.run(app, host="127.0.0.1", port=8000)
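A minimal client-side sketch for the /ocr endpoint (not part of this commit), assuming the server is running locally on port 8000 and the requests package is installed; the image URL is illustrative:

# usage sketch: POST an image URL to the OCR API
import requests

resp = requests.post(
    "http://127.0.0.1:8000/ocr",
    json={"url": "https://example.com/sample.jpg"},  # illustrative URL
)
print(resp.json())  # e.g. {"prediction": [...]} on success, {"AI": "Error: ..."} on failure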
img/a.png ADDED
main.py ADDED
@@ -0,0 +1,26 @@
+ import json
+ from io import BytesIO
+
+ from aiohttp import ClientSession
+ from ArabicOcr import arabicocr
+
+ async def getImage(img_url):
+     # fetch an image over HTTP and return it as an in-memory buffer
+     async with ClientSession() as session:
+         async with session.get(img_url) as response:
+             img_data = await response.read()
+             return BytesIO(img_data)
+
+ async def main_det(image):
+     try:
+         # arabicocr.arabic_ocr is a synchronous call, so it is not awaited;
+         # it writes the annotated image to "a.jpg" and returns the detections
+         results = arabicocr.arabic_ocr(image, "a.jpg")
+         print(results)
+         # keep only the recognized text (second element) of each result
+         words = []
+         for i in range(len(results)):
+             word = results[i][1]
+             words.append(word)
+         return json.dumps({"prediction": words})
+     except Exception as e:
+         raise ValueError(f"Error in main_det: {str(e)}")
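A minimal sketch of calling main_det outside the API (not part of this commit), assuming a local image file a.jpg exists:

# usage sketch: run the OCR coroutine directly
import asyncio
from main import main_det

print(asyncio.run(main_det("a.jpg")))  # prints a JSON string like {"prediction": [...]}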
new.jpg ADDED
test.ipynb ADDED
@@ -0,0 +1,106 @@
+ {
+ "cells": [
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from ArabicOcr import arabicocr\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 12,
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "Using CPU. Note: This module is much faster with a GPU.\n"
+ ]
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "[INFO] OCR'ing input image...\n",
+ "[INFO] 0.4919: بدأ فيأ حلم عرب ختم فيأ مهرج بحر حلم\n",
+ "[INFO] 0.2563: لدعط\n",
+ "[INFO] 0.8595: بكر يواصل سيناريو\n",
+ "[INFO] 0.6365: عبدالرحمن دخيل تماماًكون متوقعاً ضبط\n",
+ "[INFO] 0.4543: أتي مهرج بحر دول للأغنية صور هزيلاً\n",
+ "[INFO] 0.6843: فاشلا فيأكلأ شيء نظم سيىء جمل\n",
+ "[INFO] 0.6381: جمل حدث دراماتيكية يسعني الاان اقف\n",
+ "[INFO] 0.9383: سيناريو تراجيدي\n",
+ "[INFO] 0.3568: منتسماً\n",
+ "[INFO] 0.2621: ددوا\n",
+ "[INFO] 0.7647: عمل فيأ\n",
+ "[INFO] 0.5875: فصل منامة . كلأ هتم\n",
+ "[INFO] 0.9771: كتب\n",
+ "[INFO] 0.9535: للفنانين\n",
+ "[INFO] 0.7544: أسي\n",
+ "[INFO] 0.9973: حدث\n",
+ "[INFO] 0.9826: فني\n",
+ "{'Extracted': ['بدأ فيأ حلم عرب ختم فيأ مهرج بحر حلم', 'لدعط', 'بكر يواصل سيناريو', 'عبدالرحمن دخيل تماماًكون متوقعاً ضبط', 'أتي مهرج بحر دول للأغنية صور هزيلاً', 'فاشلا فيأكلأ شيء نظم سيىء جمل', 'جمل حدث دراماتيكية يسعني الاان اقف', 'سيناريو تراجيدي', 'منتسماً', 'ددوا', 'عمل فيأ', 'فصل منامة . كلأ هتم', 'كتب', 'للفنانين', 'أسي', 'حدث', 'فني']}\n"
+ ]
+ }
+ ],
+ "source": [
+ "image_path='img/a.png'\n",
+ "out_image='out/out.jpg'\n",
+ "results=arabicocr.arabic_ocr(image_path,out_image)\n",
+ "# print(results)\n",
+ "words=[]\n",
+ "for i in range(len(results)):\n",
+ "\t\tword=results[i][1]\n",
+ "\t\t# print(word)\n",
+ "\t\twords.append(word)\n",
+ "data = {\"Extracted\":words}\n",
+ "print(data)\n",
+ "# with open ('file.txt','w',encoding='utf-8')as myfile:\n",
+ "# \t\tmyfile.write(str(words))\n",
+ "# import cv2\n",
+ "# img = cv2.imread('out/out.jpg', cv2.IMREAD_UNCHANGED)\n",
+ "# cv2.imshow(\"arabic ocr\",img)\n",
+ "# cv2.waitKey(0)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "arabic",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.12.2"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+ }