Spaces:
Runtime error
Runtime error
# Import the libraries | |
import gradio as gr | |
import pandas as pd | |
import joblib | |
from sklearn.preprocessing import OneHotEncoder | |
import subprocess | |
import json | |
import uuid | |
from pathlib import Path | |
from huggingface_hub import CommitScheduler | |
# Run the training script placed in the same directory as app.py | |
# The training script will train and persist a linear regression | |
# model with the filename 'model.joblib' | |
# Load the freshly trained model from disk | |
# model = joblib.load('/content/dt_regressor.pkl') # Uncomment this line to use Decision Tree model | |
model = joblib.load('model.joblib') # Linear Regression model | |
# Prepare the logging functionality | |
log_file = Path("logs/") / f"data_{uuid.uuid4()}.json" | |
log_folder = log_file.parent | |
scheduler = CommitScheduler( | |
repo_id="debjaninath/insurance-charge-mlops-logs", # provide a name "insurance-charge-mlops-logs" for the repo_id | |
repo_type="dataset", | |
folder_path=log_folder, | |
path_in_repo="data", | |
every=2 | |
) | |
# Define the predict function which will take features, convert to dataframe and make predictions using the saved model | |
# the functions runs when 'Submit' is clicked or when a API request is made | |
def predict_charges(age, bmi, children, sex, smoker, region): | |
try: | |
# Create a DataFrame from the input features | |
data = pd.DataFrame({ | |
'age': [age], | |
'bmi': [bmi], | |
'children': [children], | |
'sex': [sex], | |
'smoker': [smoker], | |
'region': [region] | |
}) | |
# Handle categorical variables using one-hot encoding | |
data = pd.get_dummies(data) | |
# Ensure the input data has the same features as the training data | |
train_columns = model.feature_names_in_ | |
missing_columns = set(train_columns) - set(data.columns) | |
for column in missing_columns: | |
data[column] = 0 | |
data = data[train_columns] | |
print("Input data:") | |
print(data) | |
# Make predictions using the loaded model | |
prediction = model.predict(data) | |
print("Prediction:", prediction) | |
# Check if prediction is not None and has at least one element | |
if prediction is not None and len(prediction) > 0: | |
# While the prediction is made, log both the inputs and outputs to a log file | |
# While writing to the log file, ensure that the commit scheduler is locked to avoid parallel | |
# access | |
with scheduler.lock: | |
with log_file.open("a") as f: | |
f.write(json.dumps( | |
{ | |
'age': age, | |
'bmi': bmi, | |
'children': children, | |
'sex': sex, | |
'smoker': smoker, | |
'region': region, | |
'prediction': prediction[0] | |
} | |
)) | |
f.write("\n") | |
return float(prediction[0]) |