import gradio as gr
import xgboost as xgb
import numpy as np
import pandas as pd
import joblib
import os
import warnings
import shap
import matplotlib.pyplot as plt

# Suppress XGBoost warnings
warnings.filterwarnings("ignore", category=UserWarning, message=".*WARNING.*")

# Load your model (automatically detect XGBoost or joblib model)
def load_model():
    model_path = "xgboost_model.json"  # Ensure this matches your file name
    if os.path.exists(model_path):  
        model = xgb.Booster()
        model.load_model(model_path)
        print("✅ Model loaded successfully.")
        return model
    else:
        print("❌ Model file not found.")
        return None

model = load_model()

# Prediction function with consistent feature names
def predict_employee_status(satisfaction_level, last_evaluation, number_project,
                            average_monthly_hours, time_spent_company, 
                            work_accident, promotion_last_5years, salary, department, threshold=0.5):
    
    # One-hot encode the department
    departments = [
        'RandD', 'accounting', 'hr', 'management', 'marketing',
        'product_mng', 'sales', 'support', 'technical'
    ]
    department_features = {f"department_{dept}": 0 for dept in departments}
    if department in departments:
        department_features[f"department_{department}"] = 1

    # Generate Interaction Features
    satisfaction_evaluation = satisfaction_level * last_evaluation
    work_balance = average_monthly_hours / number_project

    # Prepare the input with all expected features
    input_data = {
        "satisfaction_level": [satisfaction_level],
        "last_evaluation": [last_evaluation],
        "number_project": [number_project],
        "average_monthly_hours": [average_monthly_hours],
        "time_spent_company": [time_spent_company],  # Corrected
        "Work_accident": [work_accident],
        "promotion_last_5years": [promotion_last_5years],
        "salary": [salary],
        "satisfaction_evaluation": [satisfaction_evaluation],  # Added
        "work_balance": [work_balance],  # Added
        **department_features
    }

    input_df = pd.DataFrame(input_data)

    # Predict using the model
    if model is None:
        return "❌ No model found. Please upload the model file."

    try:
        dmatrix = xgb.DMatrix(input_df)
        prediction = model.predict(dmatrix)
        prediction_prob = prediction[0]

        # Apply the dynamic threshold
        result = "✅ Employee is likely to quit." if prediction_prob >= threshold else "✅ Employee is likely to stay."
        return f"{result} (Probability: {prediction_prob:.2%})"
    except Exception as e:
        return f"❌ Error: {str(e)}"

# Gradio interface with consistent feature names
def gradio_interface():
    interface = gr.Interface(
        fn=predict_employee_status,
        inputs=[
            gr.Number(label="Satisfaction Level (0.0 - 1.0)"),
            gr.Number(label="Last Evaluation (0.0 - 1.0)"),
            gr.Number(label="Number of Projects (1 - 10)"),
            gr.Number(label="Average Monthly Hours (80 - 320)"),
            gr.Number(label="Time Spent at Company (Years)"),  # Corrected
            gr.Radio([0, 1], label="Work Accident (0 = No, 1 = Yes)"),
            gr.Radio([0, 1], label="Promotion in Last 5 Years (0 = No, 1 = Yes)"),
            gr.Radio([0, 1, 2], label="Salary (0 = Low, 1 = Medium, 2 = High)"),
            gr.Dropdown(
                ['RandD', 'accounting', 'hr', 'management', 'marketing',
                 'product_mng', 'sales', 'support', 'technical'], 
                label="Department"
            ),
            gr.Slider(0.1, 0.9, value=0.5, step=0.05, label="Prediction Threshold")
        ],
        outputs="text",
        title="Employee Retention Prediction System (With SHAP & ROC Threshold)",
        description="Predict whether an employee is likely to stay or quit based on their profile. Adjust the threshold for accurate predictions.",
        theme="dark"
    )
    interface.launch()

gradio_interface()