gp30-deployment / app.py
cccmatthew's picture
Model_serving
4cc2a8a
raw
history blame
No virus
4.65 kB
import streamlit as st
import requests
import csv
import datetime
import time
import pandas as pd
import matplotlib.pyplot as plt
import os
##########################
SECRET = os.environ["api_secret"]
headers = {"Authorization": "Bearer " + SECRET}
API_URL = "https://api-inference.huggingface.co/models/cccmatthew/model_test"
##########################
def load_response_times():
try:
df = pd.read_csv('model_interactions.csv', usecols=["Timestamp", "Response Time"])
df['Timestamp'] = pd.to_datetime(df['Timestamp'])
return df
except Exception as e:
st.error(f"Failed to read response times: {e}")
return pd.DataFrame()
def plot_response_times(df):
if not df.empty:
plt.figure(figsize=(10, 5))
plt.plot(df['Timestamp'], df['Response Time'], marker='o', linestyle='-')
plt.title('Response Times Over Time')
plt.xlabel('Timestamp')
plt.ylabel('Response Time (seconds)')
plt.grid(True)
st.pyplot(plt)
else:
st.write("No response time data to display.")
#Function to setup the logs ina csv file
def setup_csv_logger():
with open('model_interactions.csv', 'a', newline='') as file:
writer = csv.writer(file)
#The headers will be written if not present
if file.tell() == 0:
writer.writerow(["Timestamp", "User Input", "Model Prediction", "Response Time"])
def log_to_csv(sentence, results, response_time):
with open('model_interactions.csv', 'a', newline='') as file:
writer = csv.writer(file)
writer.writerow([datetime.datetime.now(), sentence, results, response_time])
setup_csv_logger()
st.title('Group 30 - DistilBERT')
st.write('This application uses DistilBERT to classify Abbreviations (AC) and Long Forms (LF)')
example_sentences = [
"RAFs are plotted for a selection of neurons in the dorsal zone (DZ) of auditory cortex in Figure 1.",
"Light dissolved inorganic carbon (DIC) resulting from the oxidation of hydrocarbons.",
"Images were acquired using a GE 3.0T MRI scanner with an upgrade for echo-planar imaging (EPI)."
]
sentence = st.selectbox('Choose an example sentence or type your own below:', example_sentences + ['Custom Input...'])
if sentence == 'Custom Input...':
sentence = st.text_input('Input your sentence here:', '')
def merge_entities(sentence, entities):
entities = sorted(entities, key=lambda x: x['start'])
annotated_sentence = ""
last_end = 0
for entity in entities:
annotated_sentence += sentence[last_end:entity['start']]
annotated_sentence += f"<mark style='background-color: #ffcccb;'><b>{sentence[entity['start']:entity['end']]}</b> [{entity['entity_group']}]</mark>"
last_end = entity['end']
annotated_sentence += sentence[last_end:]
return annotated_sentence
def send_request_with_retry(url, headers, json_data, retries=5, backoff_factor=10):
"""Send request with retries on timeouts and HTTP 503 errors."""
for attempt in range(retries):
start_time = time.time()
try:
response = requests.post(url, headers=headers, json=json_data)
response.raise_for_status()
response_time = time.time() - start_time
return response, response_time
except requests.exceptions.HTTPError as e:
if response.status_code == 503:
st.info('Server is unavailable, retrying...')
else:
raise
except (requests.exceptions.ConnectionError, requests.exceptions.Timeout) as e:
st.info(f"Network issue ({str(e)}), retrying...")
time.sleep(backoff_factor * (2 ** attempt))
st.error("Failed to process request after several attempts.")
return None, None
if st.button('Classify'):
if sentence:
API_URL = API_URL
headers = headers
response, response_time = send_request_with_retry(API_URL, headers, {"inputs": sentence})
if response is not None:
results = response.json()
st.write('Results:')
annotated_sentence = merge_entities(sentence, results)
st.markdown(annotated_sentence, unsafe_allow_html=True)
log_to_csv(sentence, results, response_time)
df = load_response_times()
plot_response_times(df)
else:
st.error("Unable to classify the sentence due to server issues.")
else:
st.error('Please enter a sentence.')
#Separate button to just plot the response time
if st.button('Show Response Time'):
df = load_response_times()
plot_response_times(df)