VrundavGamit committed
Commit d493b2a · verified · 1 Parent(s): b9a2453

Upload folder using huggingface_hub

Files changed (3)
  1. Dockerfile +9 -10
  2. app.py +69 -55
  3. requirements.txt +8 -1
Dockerfile CHANGED
@@ -1,17 +1,16 @@
-# Use a minimal base image with Python 3.9 installed
 FROM python:3.9-slim
-# FROM python:3.13-slim
 
-# Set the working directory inside the container to /app
+# Set the working directory inside the container
 WORKDIR /app
 
-# Copy all files from the current directory on the host to the container's /app directory
+# Copy all files from the current directory to the container's working directory
 COPY . .
 
-# Install Python dependencies listed in requirements.txt
-RUN pip3 install -r requirements.txt
+# Install dependencies from the requirements file without using cache to reduce image size
+RUN pip install --no-cache-dir -r requirements.txt
 
-# Define the command to run the Streamlit app on port 8501 and make it accessible externally
-CMD ["streamlit", "run", "app.py", "--server.port=8501", "--server.address=0.0.0.0", "--server.enableXsrfProtection=false"]
-
-# NOTE: Disable XSRF protection for easier external access in order to make batch predictions
+# Define the command to start the application using Gunicorn with 4 worker processes
+# - `-w 4`: Uses 4 worker processes for handling requests
+# - `-b 0.0.0.0:7860`: Binds the server to port 7860 on all network interfaces
+# - `app:app`: Runs the Flask app (assuming `app.py` contains the Flask instance named `app`)
+CMD ["gunicorn", "-w", "4", "-b", "0.0.0.0:7860", "app:app"]
app.py CHANGED
@@ -1,57 +1,71 @@
-import requests
-import streamlit as st
+import joblib
 import pandas as pd
+from flask import Flask, request, jsonify
 
-st.title("Customer Churn Prediction")
-
-# Batch Prediction
-st.subheader("Online Prediction")
-
-# Input fields for customer data
-CustomerID = st.number_input("Customer ID", min_value=10000000, max_value=99999999)
-CreditScore = st.number_input("Credit Score (customer's credit score)", min_value=300, max_value=900, value=650)
-Geography = st.selectbox("Geography (country where the customer resides)", ["France", "Germany", "Spain"])
-Age = st.number_input("Age (customer's age in years)", min_value=18, max_value=100, value=30)
-Tenure = st.number_input("Tenure (number of years the customer has been with the bank)", value=12)
-Balance = st.number_input("Account Balance (customer’s account balance)", min_value=0.0, value=10000.0)
-NumOfProducts = st.number_input("Number of Products (number of products the customer has with the bank)", min_value=1, value=1)
-HasCrCard = st.selectbox("Has Credit Card?", ["Yes", "No"])
-IsActiveMember = st.selectbox("Is Active Member?", ["Yes", "No"])
-EstimatedSalary = st.number_input("Estimated Salary (customer’s estimated salary)", min_value=0.0, value=50000.0)
-
-customer_data = {
-    'CreditScore': CreditScore,
-    'Geography': Geography,
-    'Age': Age,
-    'Tenure': Tenure,
-    'Balance': Balance,
-    'NumOfProducts': NumOfProducts,
-    'HasCrCard': 1 if HasCrCard == "Yes" else 0,
-    'IsActiveMember': 1 if IsActiveMember == "Yes" else 0,
-    'EstimatedSalary': EstimatedSalary
-}
-
-username_ns = 'VrundavGamit-containerization_case_study'
-
-if st.button("Predict", type='primary'):
-    response = requests.post("https://{username_ns}.hf.space/v1/customer", json=customer_data) # enter user name and space name before running the cell
-    if response.status_code == 200:
-        result = response.json()
-        churn_prediction = result["Prediction"] # Extract only the value
-        st.write(f"Based on the information provided, the customer with ID {CustomerID} is likely to {churn_prediction}.")
-    else:
-        st.error("Error in API request")
-
-# Batch Prediction
-st.subheader("Batch Prediction")
-
-file = st.file_uploader("Upload CSV file", type=["csv"])
-if file is not None:
-    if st.button("Predict for Batch", type='primary'):
-        response = requests.post("https://{username_ns}.hf.space/v1/customerbatch", files={"file": file}) # enter user name and space name before running the cell
-        if response.status_code == 200:
-            result = response.json()
-            st.header("Batch Prediction Results")
-            st.write(result)
-        else:
-            st.error("Error in API request")
+# Initialize Flask app with a name
+app = Flask("Telecom Customer Churn Predictor")
+
+# Load the trained churn prediction model
+model = joblib.load("churn_prediction_model_v1_0.joblib")
+
+# Define a route for the home page
+@app.get('/')
+def home():
+    return "Welcome to the Telecom Customer Churn Prediction API"
+
+# Define an endpoint to predict churn for a single customer
+@app.post('/v1/customer')
+def predict_churn():
+    # Get JSON data from the request
+    customer_data = request.get_json()
+
+    # Extract relevant customer features from the input data
+    sample = {
+        'SeniorCitizen': customer_data['SeniorCitizen'],
+        'Partner': customer_data['Partner'],
+        'Dependents': customer_data['Dependents'],
+        'tenure': customer_data['tenure'],
+        'PhoneService': customer_data['PhoneService'],
+        'InternetService': customer_data['InternetService'],
+        'Contract': customer_data['Contract'],
+        'PaymentMethod': customer_data['PaymentMethod'],
+        'MonthlyCharges': customer_data['MonthlyCharges'],
+        'TotalCharges': customer_data['TotalCharges']
+    }
+
+    # Convert the extracted data into a DataFrame
+    input_data = pd.DataFrame([sample])
+
+    # Make a churn prediction using the trained model
+    prediction = model.predict(input_data).tolist()[0]
+
+    # Map prediction result to a human-readable label
+    prediction_label = "churn" if prediction == 1 else "not churn"
+
+    # Return the prediction as a JSON response
+    return jsonify({'Prediction': prediction_label})
+
+# Define an endpoint to predict churn for a batch of customers
+@app.post('/v1/customerbatch')
+def predict_churn_batch():
+    # Get the uploaded CSV file from the request
+    file = request.files['file']
+
+    # Read the file into a DataFrame
+    input_data = pd.read_csv(file)
+
+    # Make predictions for the batch data and convert raw predictions into a readable format
+    predictions = [
+        'Churn' if x == 1
+        else "Not Churn"
+        for x in model.predict(input_data.drop("customerID", axis=1)).tolist()
+    ]
+
+    cust_id_list = input_data.customerID.values.tolist()
+    output_dict = dict(zip(cust_id_list, predictions))
+
+    return output_dict
+
+# Run the Flask app in debug mode
+if __name__ == '__main__':
+    app.run(debug=True)
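For reference, the new endpoints can be exercised with a small client like the sketch below. The base URL is an assumption derived from the Space name referenced in the previous Streamlit client, and the sample field values are only illustrative; the exact categorical encodings must match whatever the saved pipeline (churn_prediction_model_v1_0.joblib) was trained on.

import requests

BASE_URL = "https://VrundavGamit-containerization_case_study.hf.space"  # assumed Space URL

# Single prediction via POST /v1/customer
sample_customer = {
    "SeniorCitizen": 0,                  # illustrative values only; encodings
    "Partner": "Yes",                    # must match the training pipeline
    "Dependents": "No",
    "tenure": 12,
    "PhoneService": "Yes",
    "InternetService": "Fiber optic",
    "Contract": "Month-to-month",
    "PaymentMethod": "Electronic check",
    "MonthlyCharges": 70.35,
    "TotalCharges": 845.5,
}
resp = requests.post(f"{BASE_URL}/v1/customer", json=sample_customer)
print(resp.json())  # e.g. {"Prediction": "churn"} or {"Prediction": "not churn"}

# Batch prediction via POST /v1/customerbatch; the CSV (hypothetical file here)
# must contain a customerID column plus the feature columns the model expects.
with open("customers.csv", "rb") as f:
    resp = requests.post(f"{BASE_URL}/v1/customerbatch", files={"file": f})
print(resp.json())  # {customerID: "Churn" / "Not Churn", ...}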
requirements.txt CHANGED
@@ -1,3 +1,10 @@
 pandas==2.2.2
+numpy==2.0.2
+scikit-learn==1.6.1
+xgboost==2.1.4
+joblib==1.4.2
+Werkzeug==2.2.2
+flask==2.2.2
+gunicorn==20.1.0
 requests==2.28.1
-streamlit==1.43.2
+uvicorn[standard]