ml-exp-3 - Jupyter Notebook

In [1]:  # Importing necessary libraries


import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import accuracy_score, confusion_matrix
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense

# Step 1: Load the dataset
path = '/kaggle/input/bank-customer-churn-modeling/Churn_Modelling.csv'
df = pd.read_csv(path)

# Display the first few rows to check the dataset
df.head()

Out[1]:    RowNumber  CustomerId   Surname  CreditScore Geography  Gender  Age  Tenure
        0          1    15634602  Hargrave          619    France  Female   42       2
        1          2    15647311      Hill          608     Spain  Female   41       1
        2          3    15619304      Onio          502    France  Female   42       8
        3          4    15701354      Boni          699    France  Female   39       1
        4          5    15737888  Mitchell          850     Spain  Female   43       2

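The head confirms the file loads, but it is also worth checking dtypes and missing values before preprocessing. A minimal sanity check (not part of the original run) might be:

# Optional sanity check: column dtypes and null counts
df.info()
print(df.isnull().sum())

The Kaggle copy of this dataset typically has no missing values, so preprocessing can proceed directly.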

In [2]:  #STEP 2 Dropping irrelevant columns (CustomerId, Surname) and defining


X = df.drop(columns=['CustomerId', 'Surname', 'Exited']) # Features
y = df['Exited'] # Target

# Handle categorical data using one-hot encoding for 'Geography' and 'Gender'
X = pd.get_dummies(X, drop_first=True)

# Display the processed features
X.head(), y.head()

Out[2]: (   RowNumber  CreditScore  Age  Tenure    Balance  NumOfProducts  HasCrCard  \
         0          1          619   42       2       0.00              1          1
         1          2          608   41       1   83807.86              1          0
         2          3          502   42       8  159660.80              3          1
         3          4          699   39       1       0.00              2          0
         4          5          850   43       2  125510.82              1          1

            IsActiveMember  EstimatedSalary  Geography_Germany  Geography_Spain  \
         0               1        101348.88              False            False
         1               1        112542.58              False             True
         2               0        113931.57              False            False
         3               0         93826.63              False            False
         4               1         79084.10              False             True

            Gender_Male
         0        False
         1        False
         2        False
         3        False
         4        False ,
         0    1
         1    0
         2    1
         3    0
         4    0
         Name: Exited, dtype: int64)

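For reference, `drop_first=True` keeps k-1 indicator columns for a k-category feature, which is why France and Female have no columns of their own above: they are the all-False baselines. A minimal sketch on a hypothetical column:

# Hypothetical example: 3 categories -> 2 indicator columns
demo = pd.DataFrame({'Geography': ['France', 'Spain', 'Germany']})
print(pd.get_dummies(demo, drop_first=True))
# Prints Geography_Germany and Geography_Spain; a France row is False in both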

In [3]:  # Step 3: Normalize the feature data


scaler = StandardScaler()
X_scaled = scaler.fit_transform(X)

# Show the normalized data
pd.DataFrame(X_scaled, columns=X.columns).head()

Out[3]:    RowNumber  CreditScore       Age    Tenure   Balance  NumOfProducts  HasCrCard
        0  -1.731878    -0.326221  0.293517 -1.041760 -1.225848      -0.911583   0.646092
        1  -1.731531    -0.440036  0.198164 -1.387538  0.117350      -0.911583  -1.547768
        2  -1.731185    -1.536794  0.293517  1.032908  1.333053       2.527057   0.646092
        3  -1.730838     0.501521  0.007457 -1.387538 -1.225848       0.807737  -1.547768
        4  -1.730492     2.063884  0.388871 -1.041760  0.785728      -0.911583   0.646092

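StandardScaler transforms each column as z = (x - mean) / std, computed column-wise over the full feature matrix. A quick hand check against the first CreditScore value above (a sketch reusing the fitted scaler):

# Verify -0.326221 for CreditScore in row 0: z = (x - mean) / std
col = list(X.columns).index('CreditScore')
z = (X.iloc[0, col] - scaler.mean_[col]) / scaler.scale_[col]
print(z)  # ~ -0.326221, matching the table above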
In [4]:  # Step 4: Split the dataset into training and test sets
X_train, X_test, y_train, y_test = train_test_split(X_scaled, y, test_s

# Display the shapes of training and testing data to verify the split
print(f"X_train shape: {X_train.shape}")
print(f"X_test shape: {X_test.shape}")
print(f"y_train shape: {y_train.shape}")
print(f"y_test shape: {y_test.shape}")

X_train shape: (8000, 12)
X_test shape: (2000, 12)
y_train shape: (8000,)
y_test shape: (2000,)

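Churners are a minority class (roughly 20% of customers, as the test-set confusion matrix below also shows), so a stratified split that preserves the class ratio in both sets is a common refinement. The run above did not use it; a sketch:

# Optional: stratify on y so train and test keep the same churn ratio
X_train, X_test, y_train, y_test = train_test_split(
    X_scaled, y, test_size=0.2, random_state=42, stratify=y)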

In [5]:  # Step 5: Build the neural network model


model = Sequential()

# Adding the input layer and first hidden layer
model.add(Dense(units=10, activation='relu', input_dim=X_train.shape[1]))

# Adding the second hidden layer
model.add(Dense(units=10, activation='relu'))

# Adding the output layer
model.add(Dense(units=1, activation='sigmoid'))

# Compile the model
model.compile(optimizer='adam', loss='binary_crossentropy', metrics=['accuracy'])

# Train the model
history = model.fit(X_train, y_train, epochs=20, batch_size=32, validation_data=(X_test, y_test))

# Print training results
history_df = pd.DataFrame(history.history)
history_df[['accuracy', 'val_accuracy']].plot()

Epoch 1/20
/opt/conda/lib/python3.10/site-packages/keras/src/layers/core/dense.py:87: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)
250/250 ━━━━━━━━━━━━━━━━━━━━ 2s 2ms/step - accuracy: 0.6186 - loss: 0.6393 - val_accuracy: 0.8035 - val_loss: 0.4613
Epoch 2/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.7970 - loss: 0.4668 - val_accuracy: 0.8130 - val_loss: 0.4255
Epoch 3/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 1s 2ms/step - accuracy: 0.8140 - loss: 0.4395 - val_accuracy: 0.8255 - val_loss: 0.4126
Epoch 4/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8303 - loss: 0.4179 - val_accuracy: 0.8270 - val_loss: 0.4073
Epoch 5/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8318 - loss: 0.4134 - val_accuracy: 0.8300 - val_loss: 0.4028
Epoch 6/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8303 - loss: 0.4114 - val_accuracy: 0.8375 - val_loss: 0.3979
Epoch 7/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8284 - loss: 0.4083 - val_accuracy: 0.8385 - val_loss: 0.3937
Epoch 8/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8262 - loss: 0.4152 - val_accuracy: 0.8415 - val_loss: 0.3881
Epoch 9/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8406 - loss: 0.3869 - val_accuracy: 0.8470 - val_loss: 0.3773
Epoch 10/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8502 - loss: 0.3699 - val_accuracy: 0.8530 - val_loss: 0.3679
Epoch 11/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8451 - loss: 0.3718 - val_accuracy: 0.8560 - val_loss: 0.3609
Epoch 12/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8406 - loss: 0.3821 - val_accuracy: 0.8565 - val_loss: 0.3532
Epoch 13/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8538 - loss: 0.3614 - val_accuracy: 0.8570 - val_loss: 0.3502
Epoch 14/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8555 - loss: 0.3472 - val_accuracy: 0.8580 - val_loss: 0.3486
Epoch 15/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8572 - loss: 0.3521 - val_accuracy: 0.8565 - val_loss: 0.3484
Epoch 16/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8670 - loss: 0.3293 - val_accuracy: 0.8595 - val_loss: 0.3462
Epoch 17/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8618 - loss: 0.3443 - val_accuracy: 0.8580 - val_loss: 0.3448
Epoch 18/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8653 - loss: 0.3386 - val_accuracy: 0.8575 - val_loss: 0.3446
Epoch 19/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8521 - loss: 0.3457 - val_accuracy: 0.8585 - val_loss: 0.3457
Epoch 20/20
250/250 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step - accuracy: 0.8623 - loss: 0.3456 - val_accuracy: 0.8570 - val_loss: 0.3438

Out[5]: <Axes: >

[Figure: training vs. validation accuracy over the 20 epochs]


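The UserWarning printed at the start of training comes from passing `input_dim` to the first Dense layer. A warning-free sketch of the same architecture, using the explicit `Input` object that Keras now recommends:

from tensorflow.keras.layers import Input

# Same 10-10-1 architecture, declared with an explicit Input layer
model = Sequential([
    Input(shape=(X_train.shape[1],)),
    Dense(units=10, activation='relu'),
    Dense(units=10, activation='relu'),
    Dense(units=1, activation='sigmoid'),
])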

In [6]:  # Step 6: Evaluate the model


# Predicting the test set results
y_pred = (model.predict(X_test) > 0.5).astype("int32")

# Print accuracy score
accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy * 100:.2f}%")

# Print confusion matrix
cm = confusion_matrix(y_test, y_pred)
print("Confusion Matrix:")
print(cm)

63/63 ━━━━━━━━━━━━━━━━━━━━ 0s 2ms/step
Accuracy: 85.70%
Confusion Matrix:
[[1533   74]
 [ 212  181]]

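The confusion matrix shows the model is much weaker on the minority class: 212 of the 393 actual churners are missed (recall of roughly 46%), so the 85.70% accuracy overstates performance where it matters most. A sketch of per-class metrics with scikit-learn:

from sklearn.metrics import classification_report

# Per-class precision/recall; recall on 'Exited' is the key figure for churn
print(classification_report(y_test, y_pred, target_names=['Stayed', 'Exited']))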