-
Notifications
You must be signed in to change notification settings - Fork 5
/
app.py
61 lines (48 loc) · 1.85 KB
/
app.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
from PIL import Image
import google.generativeai as genai
import os # for environment variables
import streamlit as st
from dotenv import load_dotenv
# Read environment variables from a local .env file before they are looked up.
load_dotenv()
# Configure the Gemini client with the value of GOOGLE_API_KEY.
# os.getenv returns None when the variable is unset, so a missing key is
# passed through here as None rather than failing at this line.
genai.configure(api_key=os.getenv("GOOGLE_API_KEY"))
# Module-level Gemini Pro Vision model instance (not a function); it is
# created once at import time and reused by get_gemini_response.
model = genai.GenerativeModel('gemini-pro-vision')
def get_gemini_response(input, image, prompt):
    """Ask the module-level Gemini model about one image and return its text.

    The request is sent as three parts in a fixed order: ``input``, the first
    element of ``image``, then ``prompt``.

    Args:
        input: First part of the request. The caller in this file passes the
            fixed instruction text here.
        image: Sequence of image parts; only ``image[0]`` is sent.
        prompt: Last part of the request. The caller in this file passes the
            text typed by the user here.

    Returns:
        The ``text`` attribute of the model's response.
    """
    request_parts = [input, image[0], prompt]
    return model.generate_content(request_parts).text
def input_image_setup(uploaded_file):
    """Package an uploaded file as the single-item image parts list.

    Args:
        uploaded_file: Object exposing ``getvalue()`` (the raw bytes) and a
            ``type`` attribute (used as the MIME type), or ``None``.

    Returns:
        A one-element list containing a dict with the keys ``mime_type`` and
        ``data``.

    Raises:
        FileNotFoundError: If ``uploaded_file`` is ``None``.
    """
    # Guard clause: nothing was uploaded.
    if uploaded_file is None:
        raise FileNotFoundError("File not found")

    payload = uploaded_file.getvalue()
    return [{'mime_type': uploaded_file.type, 'data': payload}]
# Streamlit app: page setup, input widgets, then extraction on button press.
# set_page_config is kept as the first Streamlit call in the script.
st.set_page_config(page_title="Multi Language invoice extractor")
st.header("Multi Language invoice extractor")
st.subheader("Extract information from invoices in multiple languages")

# Stored as user_prompt (not `input`) so the builtin input() is not shadowed
# at module level; the widget key is unchanged.
user_prompt = st.text_input("Input Prompt: ", key="input")
uploaded_file = st.file_uploader(
    "Upload Invoice", type=["png", "jpg", "jpeg"], key="image")

if uploaded_file is not None:
    # Show a preview of the uploaded invoice.
    image = Image.open(uploaded_file)
    st.image(image, caption='Uploaded Image.', use_column_width=True)

submit = st.button("Extract")

# Fixed instruction text sent ahead of the image and the user's prompt.
# NOTE(review): the wording ("you will tell us what information you want to
# extract") looks unintended -- presumably the model should answer the user's
# question about the invoice. Left unchanged because it alters model output;
# confirm the intended wording.
input_prompt = """
You are an expert in invoice extraction. we will show you an invoice and you will tell us what information you want to extract from it.
"""

if submit:
    # A whitespace-only prompt is treated the same as an empty one.
    if not user_prompt.strip():
        st.write("Please enter a prompt")
    elif uploaded_file is None:
        st.write("Please upload an invoice")
    else:
        image_parts = input_image_setup(uploaded_file)
        try:
            response = get_gemini_response(
                input_prompt, image_parts, user_prompt)
        except Exception as exc:
            # UI boundary: the request can fail (network/API error, or a
            # response with no text); report it instead of a raw traceback.
            st.error(f"Could not extract information: {exc}")
        else:
            st.subheader("Extracted Information")
            st.write(response)