anand004 committed on
Commit
68093d8
·
verified ·
1 Parent(s): f55139c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -122,7 +122,7 @@ def extract_data_from_pdfs(docs, session, include_images, progress=gr.Progress()
122
 
123
  images = []
124
  for doc in docs:
125
- ocrmypdf.ocr(doc, "ocr.pdf", deskew=True, skip_text=True, output_type="pdf")
126
  text = extract_text("ocr.pdf")
127
  all_text += clean_text(text) + "\n\n"
128
  if include_images == "Include Images":
 
122
 
123
  images = []
124
  for doc in docs:
125
+ ocrmypdf.ocr(doc, "ocr.pdf", deskew=True, force_ocr=True)
126
  text = extract_text("ocr.pdf")
127
  all_text += clean_text(text) + "\n\n"
128
  if include_images == "Include Images":