Spaces:

UVA-MSBA
/

Mod3_Team5

Sleeping

App Files Files Community

Mod3_Team5 / app.py

Mpodszus

Update app.py

4e440e2 verified 4 months ago

raw

history blame contribute delete

6.18 kB

	import pickle
	import pandas as pd
	import shap
	import gradio as gr
	import numpy as np
	import matplotlib.pyplot as plt

	# Load the XGBoost model from Pickle.
	# NOTE(review): unpickling can execute arbitrary code, so this file must only
	# ever come from a trusted source (it ships alongside this app).
	# The context manager closes the file handle as soon as the model is loaded.
	with open("h22_xgb_Final(2).pkl", "rb") as model_file:
	    loaded_model = pickle.load(model_file)

	# Setup SHAP Explainer for XGBoost (Do not change this)
	explainer = shap.Explainer(loaded_model)

	def safe_convert(value, default, min_val, max_val):
	    """Convert ``value`` to a float limited to ``[min_val, max_val]``.

	    Args:
	        value: Raw input to convert (a number or a numeric string).
	        default: Value returned when ``value`` is not a usable number.
	        min_val: Lower bound of the accepted range.
	        max_val: Upper bound of the accepted range.

	    Returns:
	        The converted number clamped to the range, or ``default`` when
	        ``value`` is ``None``, non-numeric, or NaN.
	    """
	    try:
	        num = float(value)
	    except (TypeError, ValueError):
	        return default  # Use default if conversion fails

	    # NaN is the only float that compares unequal to itself. Without this
	    # guard it slips through min()/max() and comes out as min_val, silently
	    # turning an invalid input into the lowest possible score.
	    if num != num:
	        return default

	    return max(min_val, min(num, max_val))  # Ensure within range

	# Create the main function for the model
	def main_func(
	    Department,
	    ChainScale,
	    SupportiveGM,
	    Merit,
	    LearningDevelopment,
	    WorkEnvironment,
	    Engagement,
	    WellBeing,
	):
	    """Predict stay/leave probabilities and build the SHAP waterfall figure.

	    Args:
	        Department: Department chosen in the UI. Accepted so the signature
	            matches the UI inputs; it is not passed to the model.
	        ChainScale: Chain scale chosen in the UI. Accepted so the signature
	            matches the UI inputs; it is not passed to the model.
	        SupportiveGM: Supportive-GM score.
	        Merit: Merit score.
	        LearningDevelopment: Learning and development score.
	        WorkEnvironment: Work environment score.
	        Engagement: Engagement score.
	        WellBeing: Well-being score.

	        Each score is converted to a float clamped to 1-5; a value that
	        cannot be converted falls back to 3.0.

	    Returns:
	        A tuple ``(probabilities, figure)``: a dict with the keys ``"Leave"``
	        and ``"Stay"``, and the matplotlib figure holding the SHAP waterfall
	        plot for this single prediction.
	    """
	    # Column order is kept as SupportiveGM, Merit, LearningDevelopment,
	    # WorkEnvironment, Engagement, WellBeing (dicts preserve insertion order).
	    raw_scores = {
	        'SupportiveGM': SupportiveGM,
	        'Merit': Merit,
	        'LearningDevelopment': LearningDevelopment,
	        'WorkEnvironment': WorkEnvironment,
	        'Engagement': Engagement,
	        'WellBeing': WellBeing,
	    }
	    new_row = pd.DataFrame({
	        feature: [safe_convert(raw, 3.0, 1, 5)]
	        for feature, raw in raw_scores.items()
	    }).astype(float)

	    # Predict probabilities
	    prob = np.asarray(loaded_model.predict_proba(new_row))

	    # Check ndim first: indexing shape[1] on a 1-D result raises IndexError.
	    if prob.ndim == 2 and prob.shape[1] == 2:
	        # NOTE(review): assumes the columns are ordered [leave, stay] --
	        # confirm against the class labels the model was trained with.
	        leave_prob = float(prob[0, 0])
	        stay_prob = float(prob[0, 1])
	    else:
	        # Single-probability output: treat it as the "leave" probability.
	        leave_prob = float(prob.ravel()[0])
	        stay_prob = 1 - leave_prob

	    # Generate SHAP values
	    shap_values = explainer(new_row)

	    # Start from a fresh figure so the plot captured below belongs to this call.
	    plt.subplots(figsize=(8, 4))
	    shap.waterfall_plot(
	        shap.Explanation(
	            values=shap_values.values[0],
	            base_values=shap_values.base_values[0],
	            data=new_row.iloc[0],
	        ),
	        # Keep shap from calling plt.show(), so the figure is still the
	        # current one when it is laid out and captured.
	        show=False,
	    )
	    plt.tight_layout()
	    local_plot = plt.gcf()
	    # Drop the figure from pyplot's registry so figures do not pile up
	    # across requests; the returned object remains usable.
	    plt.close(local_plot)

	    return {"Leave": leave_prob, "Stay": stay_prob}, local_plot

	# Create the UI
	# Page title, shown as the browser tab title and as the page heading.
	title = "Mod 3 Team 5: Employee Turnover Predictor & Interpreter"

	# Long description rendered as Markdown under the heading. The plot is named
	# "Waterfall" here to match what the app actually renders.
	description1 = """
	This app evaluates six key factors affecting employee satisfaction—Supportive GM, Merit, Learning & Development, Work Environment, Engagement, and Well-Being—to predict whether an employee is likely to stay with Hilton or leave.
	The app provides two key outputs:

	Predicted Probability
	A likelihood score indicating whether an employee will stay or leave.

	SHAP Waterfall Plot
	A dynamic visualization that illustrates how each factor influences the prediction, helping to pinpoint the most impactful drivers of employee retention.
	Designed for HR teams at both departmental and hotel chain levels, this tool delivers data-driven insights to improve employee experience and retention strategies across Hilton properties.
	"""

	# Short usage note rendered below the long description.
	description2 = """
	To use the app, adjust the values of the employee satisfaction factors and click on Analyze.
	"""

	def _score_slider(caption):
	    """Return an interactive 1-5 slider (step 0.1, initial value 4) labelled ``caption``."""
	    return gr.Slider(
	        label=caption, minimum=1, maximum=5, value=4, step=0.1,
	        interactive=True
	    )


	# Choices offered by the two categorical inputs.
	_DEPARTMENTS = ["Guest Services", "Food and Beverage", "Housekeeping", "Front Office Operations", "Guest Activities"]
	_CHAIN_SCALES = ["Luxury", "Upper Midscale", "Upper Upscale", "Upscale", "Independent"]

	# Sample rows, in the same order as the inputs handed to main_func.
	_EXAMPLE_ROWS = [
	    ["Guest Services", "Upper Upscale", 4.1, 3.7, 3.9, 4.2, 4.4, 4.3],
	    ["Food and Beverage", "Upper Upscale", 3.9, 3.7, 4.1, 4.3, 4.5, 4.4],
	    ["Housekeeping", "Upper Upscale", 4.3, 4.0, 4.3, 4.4, 4.5, 4.4],
	]

	# NOTE(review): the nesting below (input column | output column inside one
	# row, examples underneath) is the conventional layout for this kind of
	# app -- confirm it against the running Space.
	with gr.Blocks(title=title) as demo:
	    # Header: heading, long description, rule, usage note, rule.
	    for markdown_text in (f"## {title}", description1, "---", description2, "---"):
	        gr.Markdown(markdown_text)

	    with gr.Row():
	        # Left column: all input controls followed by the trigger button.
	        with gr.Column():
	            Department = gr.Radio(_DEPARTMENTS, label="Department", value="Guest Services")
	            ChainScale = gr.Dropdown(_CHAIN_SCALES, label="ChainScale (Example)", value="Upper Upscale")
	            SupportiveGM = _score_slider("SupportiveGM Score")
	            Merit = _score_slider("Merit Score")
	            LearningDevelopment = _score_slider("Learning and Development Score")
	            WorkEnvironment = _score_slider("Work Environment Score")
	            Engagement = _score_slider("Engagement Score")
	            WellBeing = _score_slider("Well-Being Score")
	            submit_btn = gr.Button("Analyze")

	        # Right column: predicted probabilities and the SHAP plot.
	        with gr.Column(visible=True, scale=1, min_width=600) as output_col:
	            label = gr.Label(label="Predicted Intent to Stay vs Leave")
	            local_plot = gr.Plot(label='SHAP Waterfall Analysis')

	    # The button and the examples feed the same inputs to main_func and
	    # write to the same outputs.
	    model_inputs = [Department, ChainScale, SupportiveGM, Merit, LearningDevelopment, WorkEnvironment, Engagement, WellBeing]
	    model_outputs = [label, local_plot]

	    submit_btn.click(
	        fn=main_func,
	        inputs=model_inputs,
	        outputs=model_outputs,
	        api_name="Employee_Turnover"
	    )

	    gr.Markdown("### Click on any of the examples below to see how it works:")

	    gr.Examples(
	        examples=_EXAMPLE_ROWS,
	        inputs=model_inputs,
	        outputs=model_outputs,
	        fn=main_func,
	        cache_examples=True
	    )

	demo.launch()