adit94's picture
Rename s3_uiapp.py to app.py
78ddddf verified
raw
history blame
No virus
1.9 kB
import os
import tempfile
import time
import uuid

import streamlit as st

from helpers.entity_extraction_helpers import process_insurance_document
from services.pii_service import PIIService
from services.openai_service import OpenAIService
from services.mongo_service import MongoService
from services.ocr_service import OCRService
def init_session():
    """Create the service clients once per Streamlit session.

    On the first run of a session (detected by the absence of the ``'a'``
    marker key in ``st.session_state``) this builds the PII, OpenAI and OCR
    service objects and stores them under ``'pii_instance'``,
    ``'openai_instance'`` and ``'ocr_instance'``. On later reruns only the
    opening and closing banner lines are printed.

    The OpenAI client is configured from ``st.secrets`` (``OPENAI_KEY``,
    ``OPENAI_AZURE_ENDPOINT``, ``OPENAI_API_VERSION``, ``DEPLOYMENT_NAME``).
    """
    print("------------------ Initializing")

    state = st.session_state
    needs_setup = 'a' not in state
    if needs_setup:
        state['pii_instance'] = PIIService()
        print("PII service initialized")
        # NOTE(review): the pauses between service start-ups are kept as-is;
        # their purpose is not evident from this file.
        time.sleep(2)

        secrets = st.secrets
        state['openai_instance'] = OpenAIService(
            secrets["OPENAI_KEY"],
            secrets["OPENAI_AZURE_ENDPOINT"],
            secrets["OPENAI_API_VERSION"],
            secrets["DEPLOYMENT_NAME"],
        )
        print("OpenAI service initialized")
        time.sleep(2)

        state['ocr_instance'] = OCRService()
        print("OCR service initialized")

        # Marker key: its presence means every service above was created.
        state['a'] = 1

    print("-----------------------------")
# ---- Page header -----------------------------------------------------------
st.header('', divider='rainbow')
st.title("Data extraction")
st.header('', divider='rainbow')

# Streamlit re-executes this script on every interaction; init_session()
# only builds the service objects when the session does not have them yet.
init_session()

# ---- Upload, process, display ----------------------------------------------
uploaded_doc = st.file_uploader("Upload an insurance document", type=["pdf"])
if uploaded_doc is not None:
    document_id = str(uuid.uuid4())

    # The upload name is supplied by the client. Keep only its final path
    # component so it can never point outside the scratch directory, and fall
    # back to a generated name if nothing usable is left.
    safe_name = os.path.basename(uploaded_doc.name.replace("\\", "/"))
    if safe_name in ("", ".", ".."):
        safe_name = f"{document_id}.pdf"

    # A private scratch directory per run keeps same-named uploads from
    # different sessions apart and guarantees the document is deleted from
    # disk once processing has finished.
    # NOTE(review): assumes process_insurance_document is done with the file
    # by the time it returns — confirm against the helper.
    with tempfile.TemporaryDirectory() as work_dir:
        local_path = os.path.join(work_dir, safe_name)
        with open(local_path, "wb") as f:
            f.write(uploaded_doc.getbuffer())
        print(f"File uploaded :: {uploaded_doc.name} :: {document_id}")

        process_out = process_insurance_document(
            st.session_state['pii_instance'],
            "",
            st.session_state['openai_instance'],
            st.session_state['ocr_instance'],
            local_path,
            document_id,
        )

    st.header('Extracted entities !! ', divider='rainbow')
    st.write(process_out['entities'])
    st.header('', divider='rainbow')
### TO RUN :: streamlit run app.py