Spaces:

VinnoGS
/

Insurance7

Sleeping

App Files Files Community

Insurance7 / app.py

VinnoGS

Upload 5 files

9252403 verified over 1 year ago

raw

history blame contribute delete

3.68 kB

	# Import the libraries
	import joblib
	import pandas as pd
	import numpy as np
	import json
	import uuid
	from pathlib import Path
	import gradio as gr
	from sklearn.compose import make_column_transformer
	from sklearn.preprocessing import StandardScaler, OneHotEncoder
	from sklearn.impute import SimpleImputer
	from sklearn.pipeline import Pipeline


	# Run the training script placed in the same directory as app.py.
	# The script is expected to train a model and persist it under the file name
	# loaded below ("random_forest_pipeline.pkl") -- assumption based on the load
	# call; confirm against train.py.
	# NOTE(review): exec() runs train.py inside this module's namespace, so every
	# name it defines becomes a global here. Only ship a train.py you trust.
	# Path.read_text() opens and closes the file itself, so no handle is leaked.
	exec(Path("train.py").read_text())

	#from commit_scheduler import CommitScheduler

	# Load the freshly trained model from disk
	saved_model = joblib.load("random_forest_pipeline.pkl")
	print("Model loaded from random_forest_pipeline.pkl")

	# Logging setup: each run of this module gets its own uniquely named JSON
	# file inside the logs/ folder, which is created here if it is missing.
	log_folder = Path("logs/")
	log_file = log_folder / f"data_{uuid.uuid4()}.json"
	log_folder.mkdir(exist_ok=True, parents=True)

	# Simple lock mechanism for logging
	class SimpleLock:
	    """File-based mutual-exclusion lock usable as a context manager.

	    The lock is held while ``lock_file`` exists on disk. Entering the
	    context creates the file; leaving the context removes it.

	    Args:
	        lock_file: Path of the marker file that represents the lock.
	        poll_interval: Seconds to sleep between acquisition attempts while
	            another holder owns the lock.

	    Note:
	        A lock file left behind by a crashed holder is never cleaned up
	        automatically, so acquisition will wait until it is removed.
	    """

	    def __init__(self, lock_file="lockfile", poll_interval=0.01):
	        self.lock_file = Path(lock_file)
	        self.poll_interval = poll_interval

	    def __enter__(self):
	        """Block until the lock file can be created, then return ``self``."""
	        # Imported locally so this class does not depend on a file-level
	        # ``import time`` being present.
	        import time

	        while True:
	            try:
	                # exist_ok=False makes creation fail if the file is already
	                # there, so "check" and "create" happen in one step instead
	                # of a racy exists()/touch() pair.
	                self.lock_file.touch(exist_ok=False)
	            except FileExistsError:
	                # Someone else holds the lock: yield the CPU rather than
	                # spinning at full speed.
	                time.sleep(self.poll_interval)
	            else:
	                return self

	    def __exit__(self, exc_type, exc_val, exc_tb):
	        """Release the lock; exceptions from the guarded block propagate."""
	        try:
	            self.lock_file.unlink()
	        except FileNotFoundError:
	            # The marker was already removed externally; the lock is free
	            # either way, so do not mask the guarded block's outcome.
	            pass

	scheduler = SimpleLock()


	#scheduler = CommitScheduler(
	# repo_id="insurance-charge-mlops-logs", # provide a name "insurance-charge-mlops-logs" for the repo_id
	# repo_type="dataset",
	# folder_path=log_folder,
	# path_in_repo="data",
	# every=2
	#)

	def predict(age, bmi, children, sex, smoker, region):
	    """Predict a value from one set of inputs and log the request.

	    The six inputs are placed into a single-row DataFrame, passed to
	    ``saved_model.predict``, and the inputs together with the prediction
	    are appended as one JSON line to ``log_file``.

	    Args:
	        age: Value for the 'age' column.
	        bmi: Value for the 'bmi' column.
	        children: Value for the 'children' column.
	        sex: Value for the 'sex' column.
	        smoker: Value for the 'smoker' column.
	        region: Value for the 'region' column.

	    Returns:
	        The first element of the model's prediction as a built-in float.
	    """
	    # Single-row frame; column names must match what the model was fit on
	    # (assumed to be these six names -- confirm against train.py).
	    features = pd.DataFrame({
	        'age': [age],
	        'bmi': [bmi],
	        'children': [children],
	        'sex': [sex],
	        'smoker': [smoker],
	        'region': [region],
	    })

	    # The model returns a NumPy array. Convert the scalar to a built-in
	    # float once so json.dumps never sees a NumPy type it cannot serialize
	    # (e.g. float32) and callers receive a plain Python number.
	    charge = float(saved_model.predict(features)[0])

	    record = {
	        'age': age,
	        'bmi': bmi,
	        'children': children,
	        'sex': sex,
	        'smoker': smoker,
	        'region': region,
	        'prediction': charge,
	    }

	    # Hold the lock while appending so parallel requests do not interleave
	    # their writes to the log file.
	    # with scheduler.lock:
	    with scheduler:
	        with log_file.open("a") as f:
	            f.write(json.dumps(record))
	            f.write("\n")

	    return charge



	# Input widgets: three numeric fields followed by three categorical choices.
	age_input, bmi_input, children_input = (
	    gr.Number(label=caption) for caption in ("Age", "BMI", "Children")
	)
	sex_input = gr.Radio(label="Sex", choices=['male', 'female'])
	smoker_input = gr.Radio(label="Smoker", choices=['yes', 'no'])
	region_input = gr.Dropdown(
	    label="Region",
	    choices=['northeast', 'northwest', 'southeast', 'southwest'],
	)

	# Wire the widgets to predict(); the single output is rendered as a number.
	demo = gr.Interface(
	    title="HealthyLife Insurance Charge Prediction",
	    fn=predict,
	    inputs=[
	        age_input,
	        bmi_input,
	        children_input,
	        sex_input,
	        smoker_input,
	        region_input,
	    ],
	    outputs="number",
	)

	# Turn on request queuing, then start the app without a public share link
	# and with errors surfaced in the UI.
	demo.queue()
	demo.launch(show_error=True, share=False)