Spaces:

Zabihin
/

Symptom-Diagnoses

Sleeping

App Files Files Community

Symptom-Diagnoses / app.py

Zabihin

Upload 8 files

fabc124 verified 5 months ago

raw history blame contribute delete

No virus

7.61 kB

	import streamlit as st
	from utils import get_data, diseases, metrics_table
	from transformers import pipeline
	import pandas as pd
	import io
	import json
	from openai import OpenAI
	import tensorflow as tf
	from transformers import TFAutoModelForSequenceClassification, AutoTokenizer


	# Load model
	model_name = "Zabihin/Symptom_to_Diagnosis"


	@st.cache_resource(show_spinner=False)
	def _load_model_and_tokenizer(name):
	    """
	    Loads the sequence-classification model and its tokenizer once.

	    Streamlit re-executes this script on every widget interaction, so the
	    load is wrapped in st.cache_resource: the first run pays the cost and
	    later reruns reuse the same objects instead of calling
	    from_pretrained again.

	    Parameters:
	    name (str): The Hugging Face model identifier to load.

	    Returns:
	    tuple: (model, tokenizer) loaded from the given identifier.
	    """
	    return (
	        TFAutoModelForSequenceClassification.from_pretrained(name),
	        AutoTokenizer.from_pretrained(name),
	    )


	model, tokenizer = _load_model_and_tokenizer(model_name)


	def get_data(file: str):
	    """
	    Reads data from a JSON file and returns the loaded data.

	    Parameters:
	    file (str): The path to the JSON file to be read.

	    Returns:
	    dict: The data loaded from the specified JSON file (more precisely,
	    whatever top-level value the JSON document contains).

	    Raises:
	    OSError: If the file cannot be opened.
	    json.JSONDecodeError: If the file content is not valid JSON.
	    """
	    # JSON text is UTF-8; decoding explicitly keeps non-ASCII content
	    # intact instead of depending on the platform's default encoding.
	    with open(file, encoding="utf-8") as handle:
	        return json.load(handle)


	def call_gpt3(api, prompt: str):
	    """
	    Sends a prompt to the OpenAI chat completions API and returns the reply.

	    Parameters:
	    api: The OpenAI API key used to create the client.
	    prompt (str): The user message sent to the model.

	    Returns:
	    The message content of the first choice in the API response.
	    """
	    # A fixed system message frames the assistant as a medical expert;
	    # the caller's prompt follows as the single user message.
	    conversation = [
	        {"role": "system", "content": "You are a doctor expert in drugs and diseases."},
	        {"role": "user", "content": prompt},
	    ]
	    completion = OpenAI(api_key=api).chat.completions.create(
	        model="gpt-3.5-turbo",
	        messages=conversation,
	    )
	    return completion.choices[0].message.content


	# Define functions
	def get_predictions(text):
	    """
	    Classifies a symptom description with the module-level model.

	    Parameters:
	    text: The symptom description passed to the tokenizer.

	    Returns:
	    list: One (label, probability) tuple per class index of the first
	    row of the model output, in class-index order. Each probability is
	    the result of calling .numpy() on the softmax value.
	    """
	    # Inputs longer than 512 tokens are truncated by the tokenizer.
	    encoded = tokenizer(text, return_tensors="tf", truncation=True, max_length=512)
	    logits = model(encoded).logits
	    # Softmax over the last axis turns logits into per-class probabilities;
	    # only the first row of the result is used.
	    class_probs = tf.nn.softmax(logits, axis=-1)[0]
	    return [
	        (model.config.id2label[class_id], class_prob.numpy())
	        for class_id, class_prob in enumerate(class_probs)
	    ]

	def analyze_probabilities(predictions):
	    """
	    Finds the most probable label among the predictions.

	    Parameters:
	    predictions: An iterable of (label, probability) pairs.

	    Returns:
	    tuple: (label, probability) of the pair with the highest probability.
	    When several pairs share the highest probability, the first one wins.

	    Raises:
	    ValueError: If predictions is empty.
	    """
	    # A single max() pass keeps the label and its probability together.
	    # Searching for the label again by float equality can fail to find a
	    # match (for example when the maximum is NaN) and needs a second scan.
	    best = max(predictions, key=lambda pair: pair[1], default=None)
	    if best is None:
	        raise ValueError("predictions must contain at least one (label, probability) pair")
	    high_prob_label, max_prob = best
	    return high_prob_label, max_prob


	def _collect_symptom_text(symptoms):
	    """
	    Renders one sidebar multiselect per symptom category and builds the
	    text made of the descriptions of every selected symptom.

	    Parameters:
	    symptoms (dict): Maps a category name to its entries. Each entry is
	    read as entry[0] (the name offered in the widget) and entry[1] (the
	    description added to the text).

	    Returns:
	    str: The selected descriptions, each followed by a newline.
	    """
	    lines = []
	    # The per-category list gets its own name so the dict being iterated
	    # is never rebound inside the loop.
	    for category, entries in symptoms.items():
	        st.sidebar.write(f"### {category}")
	        chosen = st.sidebar.multiselect(
	            f"Select Symptoms in {category}",
	            [entry[0] for entry in entries],
	        )
	        for selected_symptom in chosen:
	            # First entry whose name matches; empty text if none does.
	            description = next(
	                (entry[1] for entry in entries if entry[0] == selected_symptom),
	                "",
	            )
	            lines.append(f"{description}\n")
	    return "".join(lines)


	def _show_disease_information(api, predicted_label):
	    """Asks GPT for medications and an explanation of the disease and displays the answer."""
	    gpt3_prompt = f"Please provide a list of medications for {predicted_label}, along with a brief explanation of this disease."
	    # Only the API call is guarded, so a rendering problem is not reported
	    # as an API key problem. Exception (rather than a bare except) lets
	    # KeyboardInterrupt and SystemExit propagate.
	    try:
	        gpt3_response = call_gpt3(api, gpt3_prompt)
	    except Exception:
	        st.warning("Unable to retrieve information using the provided API key. Please try another API key if available.")
	    else:
	        st.header(f'Information about the {predicted_label}')
	        st.info('Please note: This information is AI-generated and does not replace professional medical advice.')
	        st.write(gpt3_response)


	def _show_diagnosis(manual_input, api):
	    """Runs the classifier on the entered symptoms and displays the outcome."""
	    predictions = get_predictions(manual_input)
	    predicted_label, probability = analyze_probabilities(predictions)

	    # Only report a disease when its probability exceeds 0.6.
	    if probability > 0.6:
	        st.success(f"Based on your symptoms, there's a {100 * probability:.2f}% probability that you might have {predicted_label}.")
	        if api:
	            _show_disease_information(api, predicted_label)
	        else:
	            st.write('If you want to know more, please enter your api key')
	    else:
	        st.warning("The symptoms you've described do not strongly indicate any of the 22 diseases in our database with a high probability. It's recommended to consult a healthcare professional for a more accurate diagnosis.")
	        # NOTE(review): the expander is assumed to belong to this
	        # low-confidence branch - confirm against the deployed app.
	        with st.expander("Click here to view the list of diseases"):
	            for disease in diseases:
	                st.write(disease)


	def _render_home(symptoms):
	    """Renders the "Home" tab: symptom selection, free-text input and diagnosis."""
	    st.header("Symptom Checker and Diagnosis App", divider='violet')
	    col1, col2 = st.columns(2)
	    with col1:
	        st.image("symptom.webp", use_column_width='auto')
	    with col2:
	        st.subheader("👩‍⚕️ Enter your symptoms:")
	        st.subheader("get your diagnosis and useful advices")

	    # The sidebar selections pre-fill the text area, which the user can
	    # still edit before submitting.
	    input_text = _collect_symptom_text(symptoms)
	    manual_input = st.text_area("Symptoms", value=input_text, height=200)

	    st.warning("If you want to know more, please enter your api key and click on submit: ")
	    with st.expander("Click here to enter your api"):
	        api = st.text_input("API KEY", value="", type='password')

	    # Button to submit and get the predicted label
	    if st.button("Submit"):
	        _show_diagnosis(manual_input, api)


	def _render_about():
	    """Renders the "About Us" tab."""
	    st.title("GZ-Health")

	    st.markdown("[Zahra ZABIHINPOUR](https://www.linkedin.com/in/zahra-zabihinpour/)")
	    st.markdown("[Kevin GOUPIL](https://www.linkedin.com/in/kevin-goupil/)")
	    st.markdown(" We are a dynamic duo of data scientists collaborating to enhance our skills and stay at the forefront of the latest developments. With backgrounds in science and experience working with health data, we bring a unique blend of expertise to our data science projects. Our shared passion and commitment drive us to showcase and elevate our capabilities through innovative and impactful initiatives. Join us on this journey of continuous improvement and exploration in the world of data science. ")
	    st.markdown(" ")


	def _render_model_details():
	    """Renders the "Model Details & Evaluations" tab."""
	    st.subheader("Model Overview:")
	    st.write("This model is a fine-tuned adaptation of the bert-base-cased architecture, specifically designed for text classification tasks associated with diagnosing diseases based on symptoms. The primary goal is to scrutinize natural language symptom descriptions and accurately predict one of 22 potential diagnoses.")
	    st.subheader("Dataset Information:")
	    st.write("The model was trained on the Gretel/symptom_to_diagnosis dataset, which consists of 1,065 symptom descriptions in English, each labeled with one of the 22 possible diagnoses. This dataset focuses on detailed, fine-grained, single-domain diagnosis, making it suitable for tasks requiring nuanced symptom classification. For those interested in utilizing the model, the Symptom Checker and Diagnosis App, or the Inference API, are accessible at [https://huggingface.co/Zabihin/Symptom_to_Diagnosis](https://huggingface.co/Zabihin/Symptom_to_Diagnosis).")
	    st.subheader("Model Performance Metrics:")
	    # The separator is a regular expression (an escaped pipe), written as
	    # a raw string to avoid an invalid escape sequence. Regex separators
	    # need the Python parser engine, so it is requested explicitly.
	    metrics_data = pd.read_csv(io.StringIO(metrics_table), sep=r"\|", engine="python").dropna()
	    st.table(metrics_data)


	def main():
	    """
	    Builds the Streamlit page: loads the symptoms data, draws the sidebar
	    and renders the tab selected by the user.
	    """
	    # import symptoms data
	    symptoms = get_data('symptomes.json')

	    # Create sidebar and pages content
	    tabs = ["Home", "About Us", "Model Details & Evaluations"]
	    st.sidebar.header("Welcome to the Symptom checker app ! This app provide diagnosis based on your symptoms. Feel free to try it out !")
	    st.sidebar.divider()
	    active_tab = st.sidebar.radio("Select Tab", tabs)

	    if active_tab == "Home":
	        _render_home(symptoms)
	    elif active_tab == "About Us":
	        _render_about()
	    elif active_tab == "Model Details & Evaluations":
	        _render_model_details()



	# Build the page only when this file is executed as the main script,
	# not when it is imported as a module.
	if __name__ == "__main__":
	    main()