erikjacobs commited on
Commit
cc35189
·
verified ·
1 Parent(s): 076c964

Upload folder using huggingface_hub

Browse files
Files changed (3) hide show
  1. Dockerfile +7 -9
  2. app.py +57 -70
  3. requirements.txt +1 -8
Dockerfile CHANGED
@@ -1,16 +1,14 @@
 
1
  FROM python:3.9-slim
2
 
3
- # Set the working directory inside the container
4
  WORKDIR /app
5
 
6
- # Copy all files from the current directory to the container's working directory
7
  COPY . .
8
 
9
- # Install dependencies from the requirements file without using cache to reduce image size
10
- RUN pip install --no-cache-dir -r requirements.txt
11
 
12
- # Define the command to start the application using Gunicorn with 4 worker processes
13
- # - `-w 4`: Uses 4 worker processes for handling requests
14
- # - `-b 0.0.0.0:7860`: Binds the server to port 7860 on all network interfaces
15
- # - `app:app`: Runs the Flask app (assuming `app.py` contains the Flask instance named `app`)
16
- CMD ["gunicorn", "-w", "4", "-b", "0.0.0.0:7860", "app:app"]
 
1
+ # Use a minimal base image with Python 3.9 installed
2
  FROM python:3.9-slim
3
 
4
+ # Set the working directory inside the container to /app
5
  WORKDIR /app
6
 
7
+ # Copy all files from the current directory on the host to the container's /app directory
8
  COPY . .
9
 
10
+ # Install Python dependencies listed in requirements.txt
11
+ RUN pip3 install -r requirements.txt
12
 
13
+ # Define the command to run the Streamlit app on port 8501 and make it accessible externally
14
+ CMD ["streamlit", "run", "app.py", "--server.port=8501", "--server.address=0.0.0.0", "--server.enableXsrfProtection=false"]
 
 
 
app.py CHANGED
@@ -1,71 +1,58 @@
1
- import joblib
2
  import pandas as pd
3
- from flask import Flask, request, jsonify
4
-
5
- # Initialize Flask app with a name
6
- app = Flask("Telecom Customer Churn Predictor")
7
-
8
- # Load the trained churn prediction model
9
- model = joblib.load("churn_prediction_model_v1_0.joblib")
10
-
11
- # Define a route for the home page
12
- @app.get('/')
13
- def home():
14
- return "Welcome to the Telecom Customer Churn Prediction API"
15
-
16
- # Define an endpoint to predict churn for a single customer
17
- @app.post('/v1/customer')
18
- def predict_churn():
19
- # Get JSON data from the request
20
- customer_data = request.get_json()
21
-
22
- # Extract relevant customer features from the input data
23
- sample = {
24
- 'SeniorCitizen': customer_data['SeniorCitizen'],
25
- 'Partner': customer_data['Partner'],
26
- 'Dependents': customer_data['Dependents'],
27
- 'tenure': customer_data['tenure'],
28
- 'PhoneService': customer_data['PhoneService'],
29
- 'InternetService': customer_data['InternetService'],
30
- 'Contract': customer_data['Contract'],
31
- 'PaymentMethod': customer_data['PaymentMethod'],
32
- 'MonthlyCharges': customer_data['MonthlyCharges'],
33
- 'TotalCharges': customer_data['TotalCharges']
34
- }
35
-
36
- # Convert the extracted data into a DataFrame
37
- input_data = pd.DataFrame([sample])
38
-
39
- # Make a churn prediction using the trained model
40
- prediction = model.predict(input_data).tolist()[0]
41
-
42
- # Map prediction result to a human-readable label
43
- prediction_label = "churn" if prediction == 1 else "not churn"
44
-
45
- # Return the prediction as a JSON response
46
- return jsonify({'Prediction': prediction_label})
47
-
48
- # Define an endpoint to predict churn for a batch of customers
49
- @app.post('/v1/customerbatch')
50
- def predict_churn_batch():
51
- # Get the uploaded CSV file from the request
52
- file = request.files['file']
53
-
54
- # Read the file into a DataFrame
55
- input_data = pd.read_csv(file)
56
-
57
- # Make predictions for the batch data and convert raw predictions into a readable format
58
- predictions = [
59
- 'Churn' if x == 1
60
- else "Not Churn"
61
- for x in model.predict(input_data.drop("customerID",axis=1)).tolist()
62
- ]
63
-
64
- cust_id_list = input_data.customerID.values.tolist()
65
- output_dict = dict(zip(cust_id_list, predictions))
66
-
67
- return output_dict
68
-
69
- # Run the Flask app in debug mode
70
- if __name__ == '__main__':
71
- app.run(debug=True)
 
1
+ import streamlit as st
2
  import pandas as pd
3
+ import requests
4
+
5
+ # Streamlit UI for Customer Churn Prediction
6
+ st.title("Telecom Customer Churn Prediction App")
7
+ st.write("This tool predicts customer churn risk based on their details. Enter the required information below.")
8
+
9
+ # Collect user input based on dataset columns
10
+ CustomerID = st.number_input("Customer ID", min_value=10000000, max_value=99999999)
11
+ SeniorCitizen = st.selectbox("Senior citizen", ["Yes", "No"])
12
+ Partner = st.selectbox("Does the customer have a partner?", ["Yes", "No"])
13
+ Dependents = st.selectbox("Does the customer have dependents?", ["Yes", "No"])
14
+ PhoneService = st.selectbox("Does the customer have phone service?", ["Yes", "No"])
15
+ InternetService = st.selectbox("Type of Internet Service", ["DSL", "Fiber optic", "No"])
16
+ Contract = st.selectbox("Type of Contract", ["Month-to-month", "One year", "Two year"])
17
+ PaymentMethod = st.selectbox("Payment Method", ["Electronic check", "Mailed check", "Bank transfer", "Credit card"])
18
+ tenure = st.number_input("Tenure (Months with the company)", min_value=0, value=12)
19
+ MonthlyCharges = st.number_input("Monthly Charges", min_value=0.0, value=50.0)
20
+ TotalCharges = st.number_input("Total Charges", min_value=0.0, value=600.0)
21
+
22
+ # Convert categorical inputs to match model training
23
+ customer_data = {
24
+ 'SeniorCitizen': 1 if SeniorCitizen == "Yes" else 0,
25
+ 'Partner':Partner,
26
+ 'Dependents': Dependents,
27
+ 'tenure': tenure,
28
+ 'PhoneService': PhoneService,
29
+ 'InternetService': InternetService,
30
+ 'Contract': Contract,
31
+ 'PaymentMethod': PaymentMethod,
32
+ 'MonthlyCharges': MonthlyCharges,
33
+ 'TotalCharges': TotalCharges
34
+ }
35
+
36
+
37
+ if st.button("Predict", type='primary'):
38
+ response = requests.post("https://<user_name>-<space_name>.hf.space/v1/customer", json=customer_data) # enter user name and space name before running the cell
39
+ if response.status_code == 200:
40
+ result = response.json()
41
+ churn_prediction = result["Prediction"] # Extract only the value
42
+ st.write(f"Based on the information provided, the customer with ID {CustomerID} is likely to {churn_prediction}.")
43
+ else:
44
+ st.error("Error in API request")
45
+
46
+ # Batch Prediction
47
+ st.subheader("Batch Prediction")
48
+
49
+ file = st.file_uploader("Upload CSV file", type=["csv"])
50
+ if file is not None:
51
+ if st.button("Predict for Batch", type='primary'):
52
+ response = requests.post("https://<user_name>-<space_name>.hf.space/v1/customerbatch", files={"file": file}) # enter user name and space name before running the cell
53
+ if response.status_code == 200:
54
+ result = response.json()
55
+ st.header("Batch Prediction Results")
56
+ st.write(result)
57
+ else:
58
+ st.error("Error in API request")
 
 
 
 
 
 
 
 
 
 
 
 
 
requirements.txt CHANGED
@@ -1,10 +1,3 @@
1
  pandas==2.2.2
2
- numpy==2.0.2
3
- scikit-learn==1.6.1
4
- xgboost==2.1.4
5
- joblib==1.4.2
6
- Werkzeug==2.2.2
7
- flask==2.2.2
8
- gunicorn==20.1.0
9
  requests==2.28.1
10
- uvicorn[standard]
 
1
  pandas==2.2.2
 
 
 
 
 
 
 
2
  requests==2.28.1
3
+ streamlit==1.43.2