import streamlit as st
import tensorflow as tf
from PIL import Image
import numpy as np
# from .modules.tools import Analysing_image, text_to_speech
from gtts import gTTS
from transformers import BioGptTokenizer, AutoModelForCausalLM, pipeline
from deep_translator import GoogleTranslator, MyMemoryTranslator
import tempfile
import os
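
# To run the app locally (assuming this file is saved as app.py):
#   streamlit run app.py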
# Set the page configuration

st.set_page_config(page_title="Medical Image Classifier & Chatbot", layout="wide")
st.title("Medical Image Classifier & Chatbot")
st.sidebar.header("Medical Analysis")
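# Class-index-to-label mapping; the order is assumed to match the class
# order the classifier was trained with.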
keys = {'0': 'Cyst', '1': 'Normal', '2': 'Stone', '3': 'Tumor'}

def translate_text(text, source='auto', target='es'):
    """Translate text, falling back through several providers until one succeeds."""
    # Note: GoogleTranslator accepts source='auto'; MyMemoryTranslator requires
    # explicit language codes, so it may fail with the default arguments.
    translators = [GoogleTranslator, MyMemoryTranslator]

    for translator_cls in translators:
        try:
            translation = translator_cls(source=source, target=target).translate(text)
            print(f"{translator_cls.__name__}: {translation}")
            return translation
        except Exception as e:
            print(f"{translator_cls.__name__} failed: {e}")

    print("All translators failed. No translation found.")
    return None
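
# translate_text is kept as a fallback path; the app currently uses the
# Hugging Face translation pipeline created below (see the commented-out
# call in the translation tab).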

def Analysing_image(st, model, image_file):
    """Display the uploaded image, preprocess it, and return the predicted class label."""
    try:
        # Open and display the image
        image = Image.open(image_file)
        st.image(image, caption="Uploaded Image", use_container_width=True)

        # Preprocess the image:
        # resize to the input dimensions the model expects (150x150 here)
        # and scale pixel values to [0, 1]
        img_resized = image.resize((150, 150))
        img_array = np.array(img_resized).astype('float32') / 255.0

        # Normalize the channel count to 3: repeat grayscale channels,
        # drop the alpha channel from RGBA images
        if img_array.ndim == 2:
            img_array = np.stack((img_array,) * 3, axis=-1)
        elif img_array.shape[2] == 1:
            img_array = np.concatenate([img_array] * 3, axis=-1)
        elif img_array.shape[2] == 4:
            img_array = img_array[:, :, :3]

        # Add batch dimension
        img_batch = np.expand_dims(img_array, axis=0)

        # Run prediction
        predictions = model.predict(img_batch)
        st.write("Prediction probabilities:", predictions)

        # Multi-class classification: select the class with the highest probability
        predicted_class = np.argmax(predictions, axis=1)
        st.write("Prediction:", keys[str(predicted_class[0])])
        return keys[str(predicted_class[0])]
    except Exception as e:
        st.error(f"Could not analyse the image: {e}")
        return None
    
# Function to convert text to speech (gTTS defaults to English)
def text_to_speech(text):
    tts = gTTS(text)
    # delete=False: the caller is responsible for removing the file when done
    temp_file = tempfile.NamedTemporaryFile(delete=False, suffix=".mp3")
    tts.save(temp_file.name)
    return temp_file.name

@st.cache_resource  # Cache the model to avoid reloading on every interaction
def load_generator():
    # Use a medical-specific model like BioGPT or a general-purpose model like GPT-2
    tokenizer = BioGptTokenizer.from_pretrained("microsoft/biogpt")
    model = AutoModelForCausalLM.from_pretrained("microsoft/biogpt")
    return model, tokenizer
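
# Note: load_generator is kept as an alternative (BioGPT) backend but is not
# called below; the lighter GPT-Neo pipeline is used instead.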

@st.cache_resource  # Cache the model to avoid reloading on every interaction
def load_summarizer():
    # Use a summarization model like "facebook/bart-large-cnn"
    summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
    return summarizer

# generator, tokenizer = load_generator()
# GPT-Neo is a decoder-only (causal) model, so it is loaded with the
# "text-generation" task rather than "text2text-generation"
generator = pipeline("text-generation", model="EleutherAI/gpt-neo-125M")
summarizer = load_summarizer()
translator = pipeline("translation_en_to_de", model="Helsinki-NLP/opus-mt-en-de")
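# The generator and translator pipelines above are rebuilt on every Streamlit
# rerun; like load_summarizer, they could be wrapped in @st.cache_resource
# functions so the models load only once.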

image_file = st.sidebar.file_uploader("Upload an Image (.jpg, .jpeg, .png)", type=["jpg", "jpeg", "png"])
# Create tabs for each functionality
tab1, tab2, tab3, tab4 = st.tabs(["Classification", "Chatbot", "Translation & Summary", "Audio"])
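# Data flow between tabs: the classification result (predict_class) seeds the
# chatbot prompt, and the chatbot response is stored in st.session_state for
# the translation, summary, and audio tabs.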
predict_class = None

with tab1:
    # st.write("Upload your finalized model and an image to classify.")
    # Sidebar for uploading files   
    model_file = st.sidebar.file_uploader("Upload your Keras model (.h5 file)", type=["h5"])
    # Check if a model has been uploaded
    if model_file is not None:
        # Save the uploaded model file to disk
        with open("uploaded_model.h5", "wb") as f:
            f.write(model_file.getbuffer())
        st.sidebar.success("Model uploaded successfully!")
        
        # Attempt to load the model
        try:
            model = tf.keras.models.load_model("uploaded_model.h5")
            st.sidebar.info("Model loaded successfully!")
        except Exception as e:
            st.sidebar.error("Error loading model: " + str(e))
            st.stop()
        
        # Check if an image has been uploaded
        if image_file is not None:
            predict_class = Analysing_image(st, model, image_file)
        else:
            st.info("Please upload an image to classify.")
    else:
        st.info("Using Pretrained model")
        model = tf.keras.models.load_model("./models/medical_classifier/medical_classifier.h5")
        # model = TFAutoModel.from_pretrained('./models/medical_classifier')
        # config = model.config
        # if 'batch_shape' in config:
        #     config['input_shape'] = config.pop('batch_shape')[1:]  # Remove batch size
            
        # # Create the input layer with the corrected configuration
        # input_layer = InputLayer(**model.config)
        # # Rebuild the model (if necessary)
        # model.build(input_shape=model.config['input_shape'])

        if image_file is not None:
            predict_class = Analysing_image(st, model, image_file)
        else:
            st.info("Please upload an image to classify.")
# -----------------------------------------------------------------------------------------------

with tab2:
    if predict_class is not None:
        # Create a prompt for the model based on the predicted class
        if predict_class == 'Normal':
            prompt = "What does it mean when the doctor says my MRI is normal?"
        elif predict_class == 'Cyst':
            prompt = "What is a brain cystic lesion?"
        else:
            prompt = f"What is a brain {predict_class}?"
        # # Generate text using the cached BioGPT model (alternative path):
        # with st.spinner("Generating description..."):
        #     inputs = tokenizer(prompt, return_tensors="pt")
        #     # Generate text
        #     output = generator.generate(
        #         inputs["input_ids"],
        #         max_length=300,  # Maximum length of the generated text
        #         num_return_sequences=1,  # Number of sequences to generate
        #         no_repeat_ngram_size=2,  # Avoid repeating n-grams
        #         top_k=50,  # Controls the diversity of the text
        #         top_p=0.95,  # Nucleus sampling threshold
        #         temperature=0.7,  # Controls the creativity of the text
        #     )
        #
        #     # Decode the generated text, *excluding* the input prompt
        #     generated_text = tokenizer.decode(output[0], skip_special_tokens=True)
        #     # Find the length of the original prompt
        #     prompt_length = len(tokenizer.decode(inputs["input_ids"][0], skip_special_tokens=True))
        #     # Extract the generated part of the text
        #     generated_response = generated_text[prompt_length:]
        #     st.session_state.chat_response = generated_response

        user_input = st.text_area("Enter your prompt:", prompt)
        # Slider for controlling the length of the generated text
        max_length = st.slider("Max length of generated text", 50, 500, 100)   
        # Button to generate text
        if st.button("Generate Text"):
            with st.spinner("Generating text..."):
                # Generate text using the model
                # return_full_text=False returns only the newly generated text,
                # without echoing the prompt
                output = generator(user_input, max_length=max_length,
                                   num_return_sequences=1, return_full_text=False)
                generated_text = output[0]['generated_text']
                # Display the generated text
                st.subheader("Description:")
                st.write(generated_text)
                # Store the response for the translation, summary, and audio tabs
                st.session_state.chat_response = generated_text


# Add translation and summary functionality
with tab3:
    st.header("Translation to German & Summary")
    if 'chat_response' in st.session_state and st.session_state.chat_response:
        medical_terms = st.session_state.chat_response
        # Translate to German using the Hugging Face pipeline
        # (alternative: translation = translate_text(medical_terms, target='de'))
        translation = translator(medical_terms)
        outputs = 'Unable to translate, please Retry ...'
        if translation:
            outputs = translation[0]['translation_text']
        else:
            st.info("Unable to translate the text. Please try to refresh")
            if st.button('Refresh'):
                # Retry the same translation; the pipeline's language pair (en -> de) is fixed
                retry = translator(medical_terms)
                outputs = retry[0]['translation_text']

        # Create summary (simple example - in practice you might want to use a more sophisticated summarization method)
        # summary = " ".join(st.session_state.chat_response.split()[:30]) + "..."
        st.write("German Translation:", outputs)

        if st.button("Generate Summary"):
            if outputs != 'Unable to translate, please Retry ...':
                # Create a prompt for the model
                # prompt = f"{predict_class} is a medical condition that refers to "
                prompt = outputs
                # Generate a summary using the Hugging Face model
                with st.spinner("Generating summary..."):
                    # Summarize the prompt (you can adjust max_length and min_length)
                    summary = summarizer(prompt, max_length=85, min_length=60, do_sample=False)
                # Display the generated summary
                st.subheader("Generated Summary:")
                st.write(summary[0]['summary_text'])
            else:
                st.warning("Please enter a medical term.")
       
    else:
        st.info("No chatbot response available for translation and summary.")


# Add audio functionality
with tab4:
    st.header("Audio Output")
    if 'chat_response' in st.session_state and st.session_state.chat_response:
        # Convert chatbot response to audio
        audio_file = text_to_speech(st.session_state.chat_response)
        st.audio(audio_file)
        # Offer the audio as a download, then clean up the temp file
        with open(audio_file, "rb") as file:
            btn = st.download_button(
                label="Download audio",
                data=file,
                file_name="chat_response.mp3",
                mime="audio/mpeg"
            )
        os.unlink(audio_file)
    else:
        st.info("No chatbot response available for audio conversion.")



print("Streamlit app updated with translation, summarization, and audio features.")