import gradio as gr
import joblib
import numpy as np
import pandas as pd
from huggingface_hub import hf_hub_download
from sklearn.preprocessing import StandardScaler, OneHotEncoder, LabelEncoder

# Load the trained model and scaler objects from file


REPO_ID = "Hemg/modelxxx" # hugging face  repo ID
MoDEL_FILENAME = "studentpredict.joblib" # model file name
SCALER_FILENAME ="studentscaler.joblib" # scaler file name

model = joblib.load(hf_hub_download(repo_id=REPO_ID, filename=MoDEL_FILENAME))

scaler = joblib.load(hf_hub_download(repo_id=REPO_ID, filename=SCALER_FILENAME))
 
def encode_categorical_columns(df):
    label_encoder = LabelEncoder()
    ordinal_columns = df.select_dtypes(include=['object']).columns

    for col in ordinal_columns:
        df[col] = label_encoder.fit_transform(df[col])

    nominal_columns = df.select_dtypes(include=['object']).columns.difference(ordinal_columns)
    df = pd.get_dummies(df, columns=nominal_columns, drop_first=True)

    return df

# Define the prediction function
def predict_performance(Location, College_Fee,College, GPA, Year, Course_Interested, Faculty, Source, 
                       Visited_College_for_Inquiry_Only, Event, Attended_Any_Events, 
                       Presenter, Visited_Parents):
    
    input_data = [[Location, College_Fee,College, GPA, Year, Course_Interested, Faculty, Source,
                 Visited_College_for_Inquiry_Only, Event, Attended_Any_Events,
                 Presenter, Visited_Parents]]

    feature_names = ["Location", "College Fee", "GPA", "Year", "Course Interested",
                 "Faculty", "Source", "Visited College for Inquiry Only", "Event",
                 "Attended Any Events", "College", "Presenter", "Visited Parents"]
    
    input_df = pd.DataFrame(input_data, columns=feature_names)
    
    # Debug print 2: Show DataFrame before encoding
    print("\nDataFrame before encoding:")
    print(input_df)
    
    df = encode_categorical_columns(input_df)
    
    # Debug print 3: Show DataFrame after encoding
    print("\nDataFrame after encoding:")
    print(df)
    
    # Ensure the DataFrame columns match the scaler's expected input
    df = df.reindex(columns=scaler.feature_names_in_, fill_value=0)
    
    scaled_input = scaler.transform(df)
    
    # Debug print 4: Show scaled input
    print("\nScaled input:")
    print(scaled_input)
    
    prediction = model.predict(scaled_input)[0]
    
    # Debug print 5: Show prediction details
    print("\nPrediction details:")
    print(f"Raw prediction: {prediction}")
    prediction_probability = 1 / (1 + np.exp(-prediction))
    print(f"Probability: {prediction_probability}")
    prediction_percentage = prediction_probability * 100
    print(f"Percentage: {prediction_percentage}")
    
    return f"Chance of Admission: {prediction_percentage:.1f}%"
 
iface = gr.Interface(
    fn=predict_performance,
    inputs=[
        gr.Radio(["Kathmandu", "Bhaktapur", "Lalitpur", "Kritipur"], label="Location"),
        gr.Slider(minimum=1000000, maximum=1700000, label="College Fee"),
        gr.Slider(minimum=2, maximum=3, label="GPA"),
        gr.Slider(minimum=2024, maximum=2024, step=1, label="Year"),
        gr.Radio(["MSc IT & Applied Security", "BSc (Hons) Computing", "BSc (Hons) Computing with Artificial Intelligence", 
                 "BSc (Hons) Computer Networking & IT Security", "BSc (Hons) Multimedia Technologies", "MBA", 
                 "BA (Hons) Accounting &  Finance", "BA (Hons) Business Administration"], label="Course_Interested"),
        gr.Radio(["Science", "Management", "Humanities"], label="Faculty"),
        gr.Radio(["Event", "Facebook", "Instagram", "Offline", "Recommendation"], label="Source"),
        gr.Radio(["Yes", "No"], label="visited_college_for_inquery_only"),
        gr.Radio(["New Year", "Dashain", "Orientation", "Fresher's Party", "Holi Festival", "Welcome Ceremony"], 
                label="attended_event_name"),
        gr.Radio(["Yes", "No"], label="attended_any_event"),
        gr.Radio(["Trinity", "CCRC", "KMC", "SOS", "ISMT", "St. Xavier's", "Everest", "Prime"], label="College"),
        gr.Radio(["Ram", "Gita", "Manish", "Shyam", "Raj", "Hari", "Rina", "Shree"], label="Presenter"),
        gr.Radio(["Yes", "No"], label="visited_with_parents")  # Removed the incorrect list here
    ],
    outputs="text",
    title="chances of student admission",
    description="chances of student admission"
)

# Run the app
if __name__ == "__main__":
    iface.launch(share=True)