import streamlit as st import streamlit.components.v1 as components import numpy as np import pickle import pandas as pd pd.set_option('display.max_columns', 500) def impute_missing_values(df_,dict_impute): return df_.fillna(dict_impute) to_rescale_ = ['diff_MS','MS_d','pr_pre_tavi', 'surface_systole','MS_s','age', 'ncc_calcif_n','calc_risque_n'] to_encode_ = ['syncope_Oui', 'lcc_calc_1.0', 'bloc_branche_pre_bbd'] st.title("Pacemaker Implantation (IPM) risk prediction") st.subheader(f':red[Pre procedural] Tavi implantation model') cols = to_rescale_+to_encode_ with st.form(key='cols_form'): c1,c2= st.columns(2) c3,c4 = st.columns(2) c5,c6,c7,c8 = st.columns(4) c9,c10,c11 = st.columns(3) with c1: age = st.number_input('Age (year)',value=83) with c2: syncope_Oui = st.selectbox("Syncope",key="syncope",options=["Yes", "No"]) with c3: pr_pre_tavi = st.number_input('Pre-TAVI PR time (ms)',value=186) with c4: bloc_branche_pre_bbd = st.selectbox("Right bundle branch block",key="prebbd",options=["Yes", "No"]) with c5: lcc_calc_1 = st.selectbox("LCC calcification grade",key='lcccalc1',options=[0,1,2,3]) with c6: ncc_calcif_n = st.selectbox("NCC calcification grade",key='nccalcn',options=[0,1,2,3]) with c7: rcc_calcif_n = st.selectbox("RCC calcification grade",key='rccalcn',options=[0,1,2,3]) with c8: isc_calcif_n = st.selectbox("IS calcification",key='isccalcn',options=["Yes", "No"]) with c9: MS_s = st.number_input('Systolic membranous septal length(mm)',value=8.0) with c10: MS_d = st.number_input('Diastolic membranous septal length (mm)',value=8.9) with c11: surface_systole = st.number_input('Systolic aortic annular surface (mm²)',value=483) submitButton = st.form_submit_button(label = 'Predict') #load model, set cache to prevent reloading @st.cache_resource() def load_model(): with open(r"models/ensemble_models_pre.pkl", "rb") as input_file: models = pickle.load(input_file) return models #@st.cache_resource() def load_scaler(): with open(r"models/ensemble_scaler_pre.pkl", "rb") as input_file: scalers = pickle.load(input_file) return scalers @st.cache_resource() def load_impute(): with open(r"models/ensemble_dict_impute_pre.pkl", "rb") as input_file: dicts_impute = pickle.load(input_file) return dicts_impute with st.spinner("Loading Model...."): models = load_model() dicts_impute = load_impute() scalers = load_scaler() #st.write("Predicting Class...") with st.spinner("Prediction..."): # preprocessing diff_MS = MS_d - MS_s lcc_calc_1 = 1 if lcc_calc_1 == 1 else 0 syncope_Oui = 1 if syncope_Oui == "Yes" else 0 isc_calcif_n = 1 if isc_calcif_n == "Yes" else 0 bloc_branche_pre_bbd = 1 if bloc_branche_pre_bbd == "Yes" else 0 calc_risque_n = ncc_calcif_n + rcc_calcif_n + isc_calcif_n age = int(age)*365 bool_warning = False if MS_d<1.5 or MS_d>15.30: bool_warning = True if MS_s<2.0 or MS_s> 14.61: bool_warning = True if pr_pre_tavi<90 or pr_pre_tavi>344: bool_warning = True if surface_systole<300 or surface_systole>724: bool_warning = True if age<21156 or age>34939: bool_warning = True if bool_warning: st.write(":warning: Warning Results might not be reliable because:") if MS_d<1.5 or MS_d>15.30: st.write("Our study population had a dMS (mm) between 1.5 and 15.30 (mm)") if MS_s<2.0 or MS_s> 14.61: st.write("Our study population had a sMS (mm) between 2 and 14.61 (mm) ") if pr_pre_tavi<90 or pr_pre_tavi>344: st.write("Our study population had a pre-TAVI PR surface between 90 and 344 (ms)") if surface_systole<300 or surface_systole>724: st.write("Our study population had a systolic aortic annular surface between 300 and 724 (mm²) ") if age<21156 or age>34939: st.write("Our study population had an age between 58 and 95 years old ") pred_arr = np.array([[diff_MS,MS_d,pr_pre_tavi, surface_systole,MS_s,age, ncc_calcif_n,calc_risque_n, syncope_Oui, lcc_calc_1, bloc_branche_pre_bbd]]) pred_df = pd.DataFrame(pred_arr,columns=cols) print(pred_df.head()) pred_dfs = [impute_missing_values(pred_df,dict_impute) for dict_impute in dicts_impute] dfs_scaled_ = [scaler.transform(df_[to_rescale_]) for df_,scaler in zip(pred_dfs,scalers)] dfs_scaled = [pd.DataFrame(columns=to_rescale_,data=df_scaled_) for df_scaled_ in dfs_scaled_] dfs_cat = [pd.concat([df_scaled,pred_df[to_encode_]],axis=1) for df_scaled in dfs_scaled] pred= round( np.array([model.predict_proba(pred_df_)[0][1] for pred_df_,model in zip(dfs_cat,models)]).mean()*100,2) if pred>90: st.write("PMI risk probability >90 %") elif pred<10: st.write("PMI risk probability <10 %") else: st.write("PMI risk probability :",pred,' %')