0% found this document useful (0 votes)

18 views, 4 pages

Untitled 57

The document outlines a machine learning workflow using various regression models including Recursive Least Squares, Decision Tree, Random Forest, XGBoost, and an Artificial Neural Network (ANN) to predict a target variable from a dataset. It includes data preprocessing steps such as scaling and train-test splitting, model training with hyperparameter tuning using GridSearchCV, and evaluation of model performance using metrics like MSE, MAE, and R² score. Finally, the results are saved to an Excel file for comparison.

Uploaded by

Akash Layek

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

18 views, 4 pages

Untitled 57

Uploaded by

Akash Layek

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 4

import pandas as pd

import numpy as np
from sklearn.model_selection import train_test_split, GridSearchCV
from sklearn.metrics import mean_squared_error, mean_absolute_error,
r2_score
from sklearn.tree import DecisionTreeRegressor
from sklearn.ensemble import RandomForestRegressor
from xgboost import XGBRegressor
from sklearn.preprocessing import StandardScaler

# For ANN
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense
from tensorflow.keras.wrappers.scikit_learn import KerasRegressor

# Read the PV fault dataset. "Feature_0" is the regression target, and
# "Fault_Flag" is left out of the predictor matrix along with it.
df = pd.read_csv("Imbalanced_PV_Fault_Dataset.csv")

y = df["Feature_0"]
X = df.drop(columns=["Feature_0", "Fault_Flag"])

# Hold out 20% of the rows for evaluation; the fixed seed keeps the split
# repeatable between runs.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)

# Standardise the features. The scaler is fitted on the training split only
# and then applied unchanged to the test split.
scaler = StandardScaler()
X_train_scaled = scaler.fit_transform(X_train)
X_test_scaled = scaler.transform(X_test)

# ----------- Recursive Least Squares -----------

class RecursiveLeastSquares:
    """Online linear regressor fitted by recursive least squares (RLS).

    The model is ``y ~ theta . x`` with no intercept term. Samples are
    consumed one at a time through :meth:`update`; each call refines both
    the coefficient vector and the matrix ``P`` used to compute the gain.

    Attributes are plain and may be read directly:
        num_features: number of coefficients / expected sample length.
        lambda_factor: forgetting factor used in the gain denominator and
            to rescale ``P`` after every update.
        P: ``(num_features, num_features)`` matrix, initialised to
            ``delta * I``.
        theta: ``(num_features,)`` coefficient vector, initialised to zeros.
    """

    def __init__(self, num_features, lambda_factor=0.99, delta=1.0):
        """Create an untrained estimator.

        Args:
            num_features: length of every sample passed to ``update``.
            lambda_factor: forgetting factor (default 0.99).
            delta: scale of the initial ``P`` matrix (default 1.0).
        """
        self.num_features = num_features
        self.lambda_factor = lambda_factor
        self.P = np.eye(num_features) * delta
        self.theta = np.zeros(num_features)

    def update(self, X, y):
        """Incorporate one ``(X, y)`` observation into the estimate.

        Args:
            X: a single sample with ``num_features`` values (any array-like;
                it is flattened into a column vector).
            y: the scalar target for that sample (a size-1 array is
                accepted).

        Raises:
            ValueError: if ``X`` does not hold exactly ``num_features``
                values, or ``y`` is not a single value.
        """
        x = np.asarray(X, dtype=float).reshape(-1, 1)
        if x.shape[0] != self.num_features:
            raise ValueError(
                f"expected {self.num_features} features, got {x.shape[0]}"
            )
        # .item() rejects multi-element targets instead of letting them
        # broadcast silently into the coefficient update.
        target = np.asarray(y, dtype=float).item()

        # P @ x is needed for both the gain numerator and its denominator.
        Px = self.P @ x
        gain = Px / (self.lambda_factor + (x.T @ Px).item())

        # Prediction error measured with the coefficients *before* this step.
        error = target - (x.T @ self.theta).item()
        self.theta += error * gain.ravel()
        self.P = (self.P - gain @ x.T @ self.P) / self.lambda_factor

    def predict(self, X):
        """Return ``X @ theta`` for one sample (1-D) or a batch (2-D).

        A 1-D input yields a scalar; a ``(n_samples, num_features)`` input
        yields an array of ``n_samples`` predictions.
        """
        return np.asarray(X, dtype=float) @ self.theta

# Fit the RLS model one training sample at a time. Iterating the underlying
# arrays in lockstep avoids a positional .iloc lookup for every row.
rls = RecursiveLeastSquares(num_features=X.shape[1])
for sample, target in zip(X_train.values, y_train.values):
    rls.update(sample, target)

# Score all held-out rows with a single matrix-vector product; each entry is
# the dot product of the learned coefficients with one test row.
y_rls_pred = X_test.values @ rls.theta
# ----------- GridSearchCV Models -----------

# Decision tree: search over the depth limit with 5-fold cross-validation,
# then predict the test split with the best estimator found.
dtr_param = {'max_depth': [3, 5, 10, None]}
dtr = DecisionTreeRegressor(random_state=42)
dtr_grid = GridSearchCV(estimator=dtr, param_grid=dtr_param, cv=5)
dtr_grid.fit(X_train, y_train)
best_dtr = dtr_grid.best_estimator_
dtr_pred = best_dtr.predict(X_test)

# Random forest: search over forest size and depth limit with 5-fold
# cross-validation, then predict the test split with the best estimator.
rfr_param = {'n_estimators': [50, 100], 'max_depth': [5, 10, None]}
rfr = RandomForestRegressor(random_state=42)
rfr_grid = GridSearchCV(estimator=rfr, param_grid=rfr_param, cv=5)
rfr_grid.fit(X_train, y_train)
best_rfr = rfr_grid.best_estimator_
rfr_pred = best_rfr.predict(X_test)

# XGBoost: search over the number of boosting rounds and tree depth with
# 5-fold cross-validation, then predict the test split with the best
# estimator. verbosity=0 is passed to the regressor as in the original setup.
xgb_param = {'n_estimators': [50, 100], 'max_depth': [3, 5, 10]}
xgb = XGBRegressor(random_state=42, verbosity=0)
xgb_grid = GridSearchCV(estimator=xgb, param_grid=xgb_param, cv=5)
xgb_grid.fit(X_train, y_train)
best_xgb = xgb_grid.best_estimator_
xgb_pred = best_xgb.predict(X_test)

# ----------- ANN Model -----------

def build_ann():
    """Build and compile the feed-forward regression network.

    The network stacks two ReLU hidden layers (64 units, then 32 units) and a
    single-unit output layer with no activation specified. The input width is
    read from the module-level ``X_train``. The model is compiled with the
    ``'adam'`` optimizer and ``'mse'`` loss.

    Returns:
        The compiled ``Sequential`` model.
    """
    layers = [
        Dense(64, input_dim=X_train.shape[1], activation='relu'),
        Dense(32, activation='relu'),
        Dense(1),  # Output layer
    ]
    network = Sequential(layers)
    network.compile(optimizer='adam', loss='mse')
    return network

# Seed TensorFlow's global random generator so the network is built from the
# same seed on every run, matching the random_state=42 used by the other
# models. NOTE(review): bit-for-bit reproducibility may still depend on the
# TensorFlow backend/hardware -- confirm if exact repeatability matters.
tf.random.set_seed(42)

# Wrap the Keras model builder in the scikit-learn style regressor and train
# it silently for 100 epochs with mini-batches of 16 samples.
ann = KerasRegressor(build_fn=build_ann, epochs=100, batch_size=16, verbose=0)

# The network is trained and evaluated on the standardised features.
ann.fit(X_train_scaled, y_train)
ann_pred = ann.predict(X_test_scaled)

/var/folders/tt/9tcd3n611x1_n7ww1jb91r500000gn/T/
ipykernel_27794/2130103562.py:1: DeprecationWarning: KerasRegressor is
deprecated, use Sci-Keras (https://github.com/adriangb/scikeras)
instead. See https://www.adriangb.com/scikeras/stable/migration.html
for help migrating.
ann = KerasRegressor(build_fn=build_ann, epochs=100, batch_size=16,
verbose=0)

# ----------- Metrics -----------

# Test-set predictions, listed in the same order as the "Model" column below.
_all_preds = [y_rls_pred, dtr_pred, rfr_pred, xgb_pred, ann_pred]

# One row per model: mean squared error, mean absolute error and R^2, each
# computed against the held-out targets.
metrics = {
    "Model": ["RLS", "Decision Tree", "Random Forest", "XGBoost", "ANN"],
    "MSE": [mean_squared_error(y_test, pred) for pred in _all_preds],
    "MAE": [mean_absolute_error(y_test, pred) for pred in _all_preds],
    "R² Score": [r2_score(y_test, pred) for pred in _all_preds],
}

comparison_df = pd.DataFrame(metrics)
print(comparison_df)

# Optional: report the winning hyperparameters from each grid search
print("\nBest Parameters:")
for label, search in (("DTR:", dtr_grid), ("RFR:", rfr_grid), ("XGB:", xgb_grid)):
    print(label, search.best_params_)

Model MSE MAE R² Score

0 RLS 4.525742e-26 1.691223e-13 1.000000
1 Decision Tree 1.820721e-01 3.104887e-01 0.921079
2 Random Forest 6.800423e-02 1.663037e-01 0.970523
3 XGBoost 4.184689e-02 1.506359e-01 0.981861
4 ANN 2.230879e-04 1.038437e-02 0.999903

Best Parameters:
DTR: {'max_depth': None}
RFR: {'max_depth': None, 'n_estimators': 100}
XGB: {'max_depth': 3, 'n_estimators': 100}

import pandas as pd

# Export the model-comparison table. `comparison_df` is expected to already
# exist with the columns "Model", "MSE", "MAE" and "R² Score".

# Output file name; a relative path, so the file is written to the current
# working directory.
output_file = "comparison_report.xlsx"

# index=False keeps the DataFrame's row index out of the spreadsheet.
comparison_df.to_excel(output_file, index=False)

# The message is a single logical string; implicit concatenation keeps the
# source line short without embedding a line break in the literal.
print(
    f"Comparison report saved as '{output_file}' in your current "
    "working directory."
)

Comparison report saved as 'comparison_report.xlsx' in your current

working directory.

Multiple Choice Test Bank Questions No Feedback - Chapter 1
No ratings yet
Multiple Choice Test Bank Questions No Feedback - Chapter 1
47 pages
Mercedes-Benz Greener Manufacturing Ai
0% (1)
Mercedes-Benz Greener Manufacturing Ai
16 pages
Reference Book
No ratings yet
Reference Book
3 pages
Supple Maximizing Performance in Cs CuBiCl
No ratings yet
Supple Maximizing Performance in Cs CuBiCl
5 pages
To Improve The Performance of Models Predicting Ba
No ratings yet
To Improve The Performance of Models Predicting Ba
6 pages
Grid
No ratings yet
Grid
2 pages
AML Code For m2
No ratings yet
AML Code For m2
7 pages
ML Lab-1
No ratings yet
ML Lab-1
32 pages
COMPARISON - Jupyter Notebook
No ratings yet
COMPARISON - Jupyter Notebook
5 pages
Machine Learning Cheat Sheet
No ratings yet
Machine Learning Cheat Sheet
15 pages
5) Randomforest - Ipynb - Colaboratory
No ratings yet
5) Randomforest - Ipynb - Colaboratory
12 pages
Data Mining Practicals
No ratings yet
Data Mining Practicals
22 pages
Decision Tree Algorithm in Machine Learning
No ratings yet
Decision Tree Algorithm in Machine Learning
13 pages
ML5&6&7&8&9&10
No ratings yet
ML5&6&7&8&9&10
35 pages
ML Functions
No ratings yet
ML Functions
12 pages
Experiment 2 FDL - Jupyter Notebook
No ratings yet
Experiment 2 FDL - Jupyter Notebook
2 pages
FB Models PDF
No ratings yet
FB Models PDF
14 pages
ML Codes
No ratings yet
ML Codes
9 pages
ML LAB
No ratings yet
ML LAB
29 pages
Assgn 06 ML.ipynb - Colab
No ratings yet
Assgn 06 ML.ipynb - Colab
5 pages
Hyperparameter Tuning
No ratings yet
Hyperparameter Tuning
7 pages
AIML Project
No ratings yet
AIML Project
4 pages
Classification Review
No ratings yet
Classification Review
8 pages
Smart Factory Energy Prediction - Ipynb
No ratings yet
Smart Factory Energy Prediction - Ipynb
355 pages
Models
No ratings yet
Models
2 pages
Time Series Forecasting Basic Eda Prediction
No ratings yet
Time Series Forecasting Basic Eda Prediction
4 pages
Slip
No ratings yet
Slip
5 pages
Zerox Ready
No ratings yet
Zerox Ready
21 pages
AIH Lab2
No ratings yet
AIH Lab2
10 pages
ML Lab File Final
No ratings yet
ML Lab File Final
17 pages
Car Mock - ML Ans
No ratings yet
Car Mock - ML Ans
6 pages
ML Fat
No ratings yet
ML Fat
9 pages
Soft Sensor Code
No ratings yet
Soft Sensor Code
4 pages
Soft Sensor Code
No ratings yet
Soft Sensor Code
4 pages
Ai Int-1
No ratings yet
Ai Int-1
6 pages
Import Numpy As NP Import Pandas As PD
No ratings yet
Import Numpy As NP Import Pandas As PD
7 pages
Heart Disease 50% Code
No ratings yet
Heart Disease 50% Code
3 pages
Forest - Py
No ratings yet
Forest - Py
50 pages
MlLabManualdocx 2024 09 04 22 02 58
No ratings yet
MlLabManualdocx 2024 09 04 22 02 58
19 pages
ML Using Python Programs
No ratings yet
ML Using Python Programs
12 pages
Task 4
No ratings yet
Task 4
2 pages
Random Forest: Implementaciones de Scikit-Learn Sobre QSAR
100% (1)
Random Forest: Implementaciones de Scikit-Learn Sobre QSAR
11 pages
ML Lab Programs 2
No ratings yet
ML Lab Programs 2
16 pages
1
No ratings yet
1
13 pages
ML Assignment
No ratings yet
ML Assignment
10 pages
QB 1
No ratings yet
QB 1
11 pages
S 10
No ratings yet
S 10
11 pages
Project
No ratings yet
Project
16 pages
16BCB0126 VL2018195002535 Pe003
No ratings yet
16BCB0126 VL2018195002535 Pe003
40 pages
Homework: Grid Search For Hyperparameter Tuning: From Sklearn - Model - Selection Import Train - Test - Split
No ratings yet
Homework: Grid Search For Hyperparameter Tuning: From Sklearn - Model - Selection Import Train - Test - Split
9 pages
Import Library Python
No ratings yet
Import Library Python
10 pages
Loan ML Complete Guide
No ratings yet
Loan ML Complete Guide
3 pages
Shobit Sharma (2124399) ML Lab File PDF
No ratings yet
Shobit Sharma (2124399) ML Lab File PDF
19 pages
Hyperparameter Tuning
No ratings yet
Hyperparameter Tuning
9 pages
AI 28-01-25
No ratings yet
AI 28-01-25
18 pages
Sentimental
No ratings yet
Sentimental
11 pages
Hyperparameter Tuning Mits
No ratings yet
Hyperparameter Tuning Mits
17 pages
ML Cheat Sheet
No ratings yet
ML Cheat Sheet
7 pages
21brs1474 ML Lab 2
No ratings yet
21brs1474 ML Lab 2
25 pages
Codigo Modelo
No ratings yet
Codigo Modelo
5 pages
8 To 12 Jaimeen
No ratings yet
8 To 12 Jaimeen
34 pages
The Essential R Reference
From Everand
The Essential R Reference
Mark Gardener
No ratings yet
Lec5 CostBehavior
No ratings yet
Lec5 CostBehavior
23 pages
Efficient Bayesian Inference For AFRIMA Processes
No ratings yet
Efficient Bayesian Inference For AFRIMA Processes
33 pages
Coupon Collector
No ratings yet
Coupon Collector
16 pages
Ma 1 Sem Research Methodology p3 Winter 2018
No ratings yet
Ma 1 Sem Research Methodology p3 Winter 2018
6 pages
Presentation - Retail Sales Prediction
No ratings yet
Presentation - Retail Sales Prediction
23 pages
2019-A New Semiparametric Weibull Cure Rate Model Fitting Different Behaviors Within GAMLSS
No ratings yet
2019-A New Semiparametric Weibull Cure Rate Model Fitting Different Behaviors Within GAMLSS
18 pages
Statistics Assignment
No ratings yet
Statistics Assignment
11 pages
Reliability: Case Processing Summary
No ratings yet
Reliability: Case Processing Summary
2 pages
Chapter Three: Estimation of Multiple Linear Regression Model
No ratings yet
Chapter Three: Estimation of Multiple Linear Regression Model
18 pages
Econometric Theory: Module - Ii
No ratings yet
Econometric Theory: Module - Ii
8 pages
Correlation and Chi-Square Test - LDR 280
100% (1)
Correlation and Chi-Square Test - LDR 280
71 pages
Two-Way Anova Using SPSS
No ratings yet
Two-Way Anova Using SPSS
13 pages
Submitted By: Syeda Fizza Raza Naqvi (MBA192005) Answer 1
No ratings yet
Submitted By: Syeda Fizza Raza Naqvi (MBA192005) Answer 1
2 pages
Worksheet No. 1-Random Variable
No ratings yet
Worksheet No. 1-Random Variable
3 pages
STAT201 Probability Theory and Applications (1410) - Kwong Koon Shing
No ratings yet
STAT201 Probability Theory and Applications (1410) - Kwong Koon Shing
2 pages
GEED 10053 - Lesson 4.4 To 4.5
No ratings yet
GEED 10053 - Lesson 4.4 To 4.5
71 pages
Modeling Basketball's Points Per Possession With Application To Predicting The Outcome of College Basketball Games
No ratings yet
Modeling Basketball's Points Per Possession With Application To Predicting The Outcome of College Basketball Games
19 pages
SML Book Draft Latest (001 046)
No ratings yet
SML Book Draft Latest (001 046)
46 pages
Cf01 Tut Sol
No ratings yet
Cf01 Tut Sol
5 pages
Yulu Case Study
No ratings yet
Yulu Case Study
1 page
MA8402 Probability and Queueing MCQ
No ratings yet
MA8402 Probability and Queueing MCQ
18 pages
Logistic Regression
No ratings yet
Logistic Regression
49 pages
Work Sheet For Final Exam
No ratings yet
Work Sheet For Final Exam
4 pages
Chapter 3
No ratings yet
Chapter 3
2 pages
6 - CFA-SEM Intro - 4-18-11
100% (1)
6 - CFA-SEM Intro - 4-18-11
94 pages
Rebound Hammer Summary
No ratings yet
Rebound Hammer Summary
39 pages
Stastics Question
No ratings yet
Stastics Question
7 pages
Chapter 7
No ratings yet
Chapter 7
63 pages

Untitled 57

Uploaded by

Untitled 57

Uploaded by

import pandas as pd

# ----------- Recursive Least Squares -----------

def update(self, X, y):

# ----------- ANN Model -----------

ann = KerasRegressor(build_fn=build_ann, epochs=100, batch_size=16,

# ----------- Metrics -----------

# Optional: print best parameters

Model MSE MAE R² Score

# Assuming `comparison_df` already exists from previous code

# Define output file name

print(f"Comparison report saved as '{output_file}' in your current

Comparison report saved as 'comparison_report.xlsx' in your current

You might also like