Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -122,7 +122,7 @@ def extract_data_from_pdfs(docs, session, include_images, progress=gr.Progress()
|
|
122 |
|
123 |
images = []
|
124 |
for doc in docs:
|
125 |
-
ocrmypdf.ocr(doc, "ocr.pdf", deskew=True,
|
126 |
text = extract_text("ocr.pdf")
|
127 |
all_text += clean_text(text) + "\n\n"
|
128 |
if include_images == "Include Images":
|
|
|
122 |
|
123 |
images = []
|
124 |
for doc in docs:
|
125 |
+
ocrmypdf.ocr(doc, "ocr.pdf", deskew=True, force_ocr=True)
|
126 |
text = extract_text("ocr.pdf")
|
127 |
all_text += clean_text(text) + "\n\n"
|
128 |
if include_images == "Include Images":
|