-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathapp.py
More file actions
76 lines (59 loc) · 2.13 KB
/
app.py
File metadata and controls
76 lines (59 loc) · 2.13 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
import streamlit as st
import numpy as np
import tensorflow as tf
from tensorflow.keras.models import load_model
from sklearn.preprocessing import StandardScaler, LabelEncoder, OneHotEncoder
import pandas as pd
import pickle
## Load the trained model
model = load_model('model.h5')
## load encoders and scales
with open('label_encoder_gender.pkl', 'rb') as file:
label_encoder_gender = pickle.load(file)
with open('ohe_geo.pkl', 'rb') as file:
ohe_geo = pickle.load(file)
with open('scaler.pkl', 'rb') as file:
scaler = pickle.load(file)
## streamlit app
st.title('Customer churn prediction')
# User input
geography = st.selectbox('Geography', ohe_geo.categories_[0])
gender = st.selectbox('Gender', label_encoder_gender.classes_)
age = st.slider('Age', 18, 92)
balance = st.number_input('Balance')
credit_score = st.number_input('Credit Score')
estimated_salary = st.number_input('Estimated Salary')
tenure = st.slider('Tenure', 0, 10)
num_of_products = st.slider('Number of Products', 1, 4)
has_cr_card = st.selectbox('Has Credit Card', [0, 1])
is_active_member = st.selectbox('Is Active Member', [0, 1])
# Prepare the input data
input_data = pd.DataFrame({
'CreditScore': [credit_score],
'Gender': [label_encoder_gender.transform([gender])[0]],
'Age': [age],
'Tenure': [tenure],
'Balance': [balance],
'NumOfProducts': [num_of_products],
'HasCrCard': [has_cr_card],
'IsActiveMember': [is_active_member],
'EstimatedSalary': [estimated_salary]
})
geo_encoded = ohe_geo.transform([[geography]]).toarray()
geo_encoded_df = pd.DataFrame(
geo_encoded,
columns=ohe_geo.get_feature_names_out((['Geography']))
)
input_data = pd.concat(
[input_data.reset_index(drop=True),
geo_encoded_df],
axis=1
)
input_data_scaled = scaler.transform(input_data)
predictions = model.predict(input_data_scaled)
predictions_proba = predictions[0][0]
st.write(f'churn probability: {predictions_proba:.2f}')
if predictions_proba > 0.5:
st.write("The customer is likely to churn.")
else:
st.write("The customer is not likely to churn.")