-
Notifications
You must be signed in to change notification settings - Fork 0
/
app.py
61 lines (46 loc) · 1.63 KB
/
app.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
# invoice extractor
import google.generativeai as genai
from PIL import Image
import os
import streamlit as st
from dotenv import load_dotenv
# Pull settings from a local .env file (if one is present) into the process
# environment before anything reads them.
load_dotenv()
# Hand the Gemini client its API key, taken from the GOOGLE_API_KEY variable;
# the lookup yields None when the variable is unset.
genai.configure(api_key=os.environ.get("GOOGLE_API_KEY"))
# function to load Gemini Pro vision model and get Response
def get_gemini_response(input, image, prompt, *, model_name="gemini-pro-vision"):
    """Send a text + image + text request to a Gemini model and return its reply.

    Args:
        input: First text part of the request. The name shadows the builtin
            ``input``; it is kept so existing keyword callers keep working.
        image: Sequence whose first element is the image part to send (for
            example the list returned by ``input_image_setup``). Only
            ``image[0]`` is used.
        prompt: Text part placed after the image.
        model_name: Identifier of the Gemini model to instantiate. Defaults
            to ``"gemini-pro-vision"``, the value that used to be hard-coded.
            NOTE(review): confirm this model id is still served by the API
            before relying on the default.

    Returns:
        The ``text`` attribute of the response returned by
        ``generate_content``.

    Raises:
        IndexError: If ``image`` is an empty sequence.
    """
    model = genai.GenerativeModel(model_name)
    # The parts are sent in this exact order: instruction, image, question.
    response = model.generate_content([input, image[0], prompt])
    return response.text
def input_image_setup(uploaded_file):
    """Wrap an uploaded file as the single-element image-part list for Gemini.

    Args:
        uploaded_file: Object exposing ``getvalue()`` (the raw file bytes)
            and a ``type`` attribute (used as the MIME type), or ``None``
            when nothing was uploaded. Presumably a Streamlit uploaded-file
            object; any object with those two members works.

    Returns:
        A list containing one dict with the keys ``"mime_type"`` and
        ``"data"``.

    Raises:
        FileNotFoundError: If ``uploaded_file`` is ``None``.
    """
    # Guard clause: fail fast so the happy path below stays flat.
    if uploaded_file is None:
        raise FileNotFoundError("no file uploaded")

    # Read the whole upload into memory as bytes.
    bytes_data = uploaded_file.getvalue()
    return [
        {
            "mime_type": uploaded_file.type,
            "data": bytes_data,
        }
    ]
# initialize our streamlit app
st.set_page_config(page_title="Invoice extractor")
st.header("GEMINI Application")

# The user's free-form question about the invoice. Bound to ``user_question``
# so the builtin ``input`` is not shadowed at module level; the widget key
# stays "input".
user_question = st.text_input("Input prompt:", key="input")
submit = st.button('Submit')
uploaded_file = st.file_uploader(
    "choose an image...", type=["jpg", "jpeg", "png"])

image = ''
if uploaded_file is not None:
    # Show a preview so the user can confirm the right file was selected.
    image = Image.open(uploaded_file)
    st.image(image, caption="uploaded image", use_column_width=True)

# Fixed instruction sent as the first text part of every request.
input_prompt = '''
you are expert in understanding invoices. you will recieve input images as invoices and you will have to answer questions based on input image.
'''

if submit:
    if uploaded_file is None:
        # input_image_setup raises FileNotFoundError for a missing upload;
        # show a readable message instead of letting that surface as a
        # traceback in the page.
        st.warning("Please upload an invoice image before submitting.")
    else:
        image_data = input_image_setup(uploaded_file)
        response = get_gemini_response(input_prompt, image_data, user_question)
        st.subheader("The Response")
        st.write(response)