EddieXIA commited on
Commit
9c5e00f
1 Parent(s): 4477f45

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +40 -0
app.py ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Import necessary libraries
2
+ import streamlit as st
3
+ from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
4
+ import PyPDF2
5
+ import pytesseract
6
+ from PIL import Image
7
+
8
+ # Load StarCoder model and tokenizer
9
+ model_name = "starcoder-plus" # Replace with the correct model name
10
+ model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
11
+ tokenizer = AutoTokenizer.from_pretrained(model_name)
12
+
13
+ # Streamlit app
14
+ st.title("Conversational AI Chatbot")
15
+
16
+ # User input for code-related question
17
+ user_input = st.text_input("Enter your code-related question:")
18
+ if user_input:
19
+ # Tokenize and generate code
20
+ inputs = tokenizer(user_input, return_tensors="pt")
21
+ outputs = model.generate(**inputs)
22
+ code = tokenizer.decode(outputs[0])
23
+ st.code(code) # Display the generated code
24
+
25
+ # User input for PDF reading
26
+ pdf_file = st.file_uploader("Upload a PDF file:", type=["pdf"])
27
+ if pdf_file:
28
+ pdf_reader = PyPDF2.PdfFileReader(pdf_file)
29
+ pdf_text = ""
30
+ for page_num in range(pdf_reader.numPages):
31
+ page = pdf_reader.getPage(page_num)
32
+ pdf_text += page.extractText()
33
+ st.text(pdf_text) # Display the extracted text
34
+
35
+ # User input for OCR (image to text)
36
+ image_file = st.file_uploader("Upload an image for OCR:", type=["png", "jpg", "jpeg"])
37
+ if image_file:
38
+ image = Image.open(image_file)
39
+ ocr_text = pytesseract.image_to_string(image)
40
+ st.text(ocr_text) # Display the extracted text