Spaces:

darthPanda
/

invoice_extractor

Sleeping

App Files Files Community

darthPanda committed on Feb 14

Commit

7110704

•

1 Parent(s): 8c3ae58

added simple api call

Browse files

Files changed (4) hide show

.gitignore +0 -0
app.py +25 -0
requirements.txt +6 -0
utils.py +67 -0

.gitignore ADDED Viewed

File without changes

app.py ADDED Viewed

	@@ -0,0 +1,25 @@

+import os
+import streamlit as st
+import utils
+# Set up the sidebar
+# Ask the user for an API key in the sidebar
+os.environ["OPENAI_API_KEY"] = st.sidebar.text_input("OpenAI API Key", type="password")
+# Main body of the app
+# Display a title
+st.title("Invoice Data Extractor")
+if os.environ["OPENAI_API_KEY"] == "":
+    disable_file_uploader = True
+    st.error('Kindly enter OpenAI API key')
+else:
+    disable_file_uploader = False
+# Add a file uploader widget
+uploaded_file = st.file_uploader("Upload invoice image", type=['png', 'jpg'], disabled=disable_file_uploader)
+if uploaded_file is not None:
+    response = utils.pass_to_openai_vision_api(uploaded_file)
+    st.write('Data extracted from invoice is ')
+    st.write(response)

requirements.txt ADDED Viewed

	@@ -0,0 +1,6 @@

+streamlit==1.25.0
+llama-index-callbacks-wandb
+llama-index-llms-openai
+llama-index-multi-modal-llms-openai
+openai
+matplotlib

utils.py ADDED Viewed

	@@ -0,0 +1,67 @@

+import base64
+import requests
+import os
+def pass_to_openai_vision_api(image):
+    # OpenAI API Key
+    api_key = os.environ["OPENAI_API_KEY"]
+    # Getting the base64 string
+    base64_image = base64.b64encode(image.read()).decode('utf-8')
+    headers = {
+    "Content-Type": "application/json",
+    "Authorization": f"Bearer {api_key}"
+    }
+    gpt_prompt='''Above is the text extracted from an invoice.
+You are an assistant tasked with extracting information from the invoice. Do this step by step.
+1. First extract the date and due date.
+2. Then assign it a category (e.g Food).
+3. Extract the invoice number and vendor account number.
+4. Extract the total amount.
+5. Extract the items along with their name, quantity and individual price.
+Output should only contain a dictionary in the following format
+{
+    "Date": None,
+    "Due Date": None,
+    "Category": None,
+    "Invoice Number": None,
+    "Vendor Account Number": None,
+    "Total Amount": None,
+    "Items": [
+        {
+            "Item": None,
+            "Quantity": None,
+            "Individual Price": None
+        }
+    ]
+}
+If a key is not mentioned in invoice or you dont understand, then make its value None
+'''
+    payload = {
+    "model": "gpt-4-vision-preview",
+    "messages": [
+        {
+        "role": "user",
+        "content": [
+            {
+            "type": "text",
+            "text": gpt_prompt
+            },
+            {
+            "type": "image_url",
+            "image_url": {
+                "url": f"data:image/jpeg;base64,{base64_image}"
+            }
+            }
+        ]
+        }
+    ],
+    "max_tokens": 300   # To be investigated
+    }
+    response = requests.post("https://api.openai.com/v1/chat/completions", headers=headers, json=payload)
+    return response.json()['choices'][0]['message']['content']