0% found this document useful (0 votes)

10 views6 pages

HW4ML Project Starter Code Template

The document provides code templates for evaluating and profiling machine learning models using TensorFlow, specifically for the Fashion MNIST and CIFAR-10 datasets. It includes functions for model creation, dataset preparation, evaluation, and quantization to INT8 format, along with profiling for inference latency. Additionally, it emphasizes the importance of ensuring code correctness and discusses the impact of model pruning and compression on performance metrics.

Uploaded by

Amal

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

10 views6 pages

HW4ML Project Starter Code Template

Uploaded by

Amal

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

You are on page 1/ 6

Accuracy, Parameters Count, Training Time (s), Inference Latency (ms).

Accuracy/Parameters Count, Accuracy/Training Time

Writing a bonus paragraph about pruning % and compression impact?

Phase-1 code starter template

The code below is provided for your reference; feel free to change it partially or
fully.

Please make sure it does not have any bugs or mistakes. Code authors DO NOT claim
the code is bug-free. It is the student's responsibility to ensure its correctness.

import os
import time

import numpy as np
import tensorflow as tf
from tensorflow.keras import layers, models
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.datasets import fashion_mnist, cifar10
from tensorflow.keras.utils import to_categorical
from tqdm import tqdm

def create_base_model(input_shape, num_classes):
    """Build and compile the small baseline CNN classifier.

    The network is a single 3x3 convolution with 16 filters, 2x2 max
    pooling, a flatten step, a 2-unit ReLU dense layer and a softmax
    output layer.

    Args:
        input_shape: Shape of one input sample, given to the first layer.
        num_classes: Number of units in the softmax output layer.

    Returns:
        The compiled ``Sequential`` model (Adam optimizer, categorical
        cross-entropy loss, accuracy metric).
    """
    model = models.Sequential([
        layers.Conv2D(16, (3, 3), activation='relu', input_shape=input_shape),
        layers.MaxPooling2D((2, 2)),
        layers.Flatten(),
        # NOTE(review): a 2-unit hidden layer is a very tight bottleneck for
        # a multi-class output; presumably a deliberately weak baseline that
        # is meant to be tuned -- confirm before changing.
        layers.Dense(2, activation='relu'),
        layers.Dense(num_classes, activation='softmax'),
    ])
    # One-hot labels are expected, hence categorical cross-entropy.
    model.compile(optimizer='adam',
                  loss='categorical_crossentropy',
                  metrics=['accuracy'])
    return model

def prepare_dataset(dataset_name):
    """Load a supported dataset and prepare it for training.

    Images are converted to float32 and divided by 255; labels are one-hot
    encoded with ``to_categorical``.

    Args:
        dataset_name: Either ``'fashion_mnist'`` or ``'cifar10'``.

    Returns:
        ``((x_train, y_train), (x_test, y_test), input_shape, num_classes)``.

    Raises:
        ValueError: If ``dataset_name`` is not one of the supported names.
    """
    if dataset_name == 'fashion_mnist':
        (x_train, y_train), (x_test, y_test) = fashion_mnist.load_data()
        num_classes = 10
        input_shape = (28, 28, 1)
        # Add the explicit single-channel axis that Conv2D expects.
        x_train = x_train.reshape(-1, 28, 28, 1)
        x_test = x_test.reshape(-1, 28, 28, 1)
    elif dataset_name == 'cifar10':
        (x_train, y_train), (x_test, y_test) = cifar10.load_data()
        num_classes = 10
        input_shape = (32, 32, 3)
    else:
        raise ValueError(f"Unsupported dataset: {dataset_name}")

    x_train = x_train.astype('float32') / 255
    x_test = x_test.astype('float32') / 255
    y_train = to_categorical(y_train, num_classes)
    y_test = to_categorical(y_test, num_classes)

    return (x_train, y_train), (x_test, y_test), input_shape, num_classes

def evaluate_model(dataset_name, max_epoch, device):
    """Train the baseline model on a dataset and measure it on the test set.

    Training uses batch size 64, holds out 20% of the training data for
    validation and stops early when ``val_loss`` has not improved for three
    epochs, restoring the best weights.

    Args:
        dataset_name: Dataset name understood by ``prepare_dataset``.
        max_epoch: Upper bound on the number of training epochs.
        device: TensorFlow device string used for training and evaluation.

    Returns:
        ``(model, num_param, x_test, test_accuracy, train_time, eval_time)``
        where both times are in seconds.
    """
    train_data, test_data, input_shape, num_classes = prepare_dataset(
        dataset_name)
    x_train, y_train = train_data
    x_test, y_test = test_data

    with tf.device(device):
        model = create_base_model(input_shape, num_classes)
        early_stop = EarlyStopping(monitor='val_loss', patience=3,
                                   restore_best_weights=True)

        # perf_counter is monotonic, so the intervals cannot be skewed by
        # system clock adjustments.
        start_time = time.perf_counter()
        model.fit(x_train, y_train, epochs=max_epoch, batch_size=64,
                  validation_split=0.2,
                  callbacks=[early_stop], verbose=1)
        train_time = time.perf_counter() - start_time

        start_time = time.perf_counter()
        _, test_accuracy = model.evaluate(x_test, y_test, verbose=0)
        eval_time = time.perf_counter() - start_time

    num_param = model.count_params()  # counting number of model's parameters

    print(f"{dataset_name.upper()} Test Accuracy: {test_accuracy * 100:.2f}%")
    print(f"{dataset_name.upper()} Number of Parameters: {num_param}")

    return model, num_param, x_test, test_accuracy, train_time, eval_time

def profile_workload(model, device, dev_name, image, iterations=30):
    """Measure the average single-call inference latency of ``model``.

    Ten untimed warm-up calls are made first, then ``iterations`` timed
    calls. The predicted class for ``image`` is printed at the end.

    Args:
        model: Callable model, invoked as ``model(image, training=False)``.
        device: TensorFlow device string the calls are placed on.
        dev_name: Human-readable device name used in the printed messages.
        image: Input passed to the model on every call.
        iterations: Number of timed calls; must be at least 1.

    Returns:
        The mean latency of the timed calls in milliseconds.

    Raises:
        ValueError: If ``iterations`` is smaller than 1.
    """
    if iterations < 1:
        # An empty sample would make the mean NaN.
        raise ValueError("iterations must be at least 1")

    print(f"Profiling on {dev_name}...")
    latencies = []
    with tf.device(device):
        # Warm-up calls are deliberately not timed.
        for _ in tqdm(range(10), desc="Warm-up..."):
            model(image, training=False)

        for _ in tqdm(range(iterations), desc="Profiling"):
            start = time.perf_counter()
            model(image, training=False)
            latencies.append((time.perf_counter() - start) * 1000)

        prediction = model(image, training=False)

    avg_latency = np.mean(latencies)
    print(f"Average Latency on {dev_name}: {avg_latency:.2f} ms")

    predicted_class = tf.argmax(prediction, axis=1).numpy()[0]
    print(f"Predicted Class: {predicted_class}")
    return avg_latency

# Device priority: GPU > CPU.
# TensorFlow has no 'MPS' device type; Apple-silicon GPUs exposed through the
# tensorflow-metal plugin are listed under 'GPU', just like CUDA GPUs, so a
# single GPU check covers both.
if tf.config.list_physical_devices('GPU'):
    device = '/GPU:0'
    dev_name = 'GPU'
else:
    device = '/CPU:0'
    dev_name = 'CPU'
print(f'using {dev_name}')

datasets = ['fashion_mnist', 'cifar10']
for dataset in datasets:
    print(f"\nProcessing {dataset}...")
    model, num_param, x_test, acc, train_t, eval_t = evaluate_model(
        dataset, max_epoch=25, device=device)
    # Accuracy and parameter count are printed by evaluate_model; report the
    # timings here so they are not silently dropped.
    print(f"{dataset.upper()} Training Time: {train_t:.2f} s")
    print(f"{dataset.upper()} Evaluation Time: {eval_t:.4f} s")

    # Profile latency on a single test sample (batch of one).
    test_image = tf.convert_to_tensor(x_test[:1], dtype=tf.float32)
    profile_workload(model, device, dev_name, test_image)

Phase-3 code starter template

The code below is provided for your reference; feel free to change it partially or
fully.

Please make sure it does not have any bugs or mistakes. Code authors DO NOT claim
the code is bug-free. It is the student's responsibility to ensure its correctness.

# Stop early on an untested TensorFlow release. The version string lives in
# tf.__version__; tf.version is a module and never equals a string.
assert tf.__version__ == '2.15.0', (
    'WARNING!!! different TensorFlow version may produce an error while '
    'quantizing.')

def create_base_model(input_shape, num_classes):
    """Build and compile the three-stage CNN used for the quantization study.

    The network stacks three blocks of a 16-filter 3x3 convolution followed
    by 2x2 max pooling, then a flatten step, a 2-unit ReLU dense layer and a
    softmax output layer.

    Args:
        input_shape: Shape of one input sample, given to the first layer.
        num_classes: Number of units in the softmax output layer.

    Returns:
        The compiled ``Sequential`` model (Adam optimizer, categorical
        cross-entropy loss, accuracy metric).
    """
    model = models.Sequential([
        # Only the first layer declares the input shape; later layers infer
        # theirs from the preceding layer's output.
        layers.Conv2D(16, (3, 3), activation='relu', input_shape=input_shape),
        layers.MaxPooling2D((2, 2)),
        layers.Conv2D(16, (3, 3), activation='relu'),
        layers.MaxPooling2D((2, 2)),
        layers.Conv2D(16, (3, 3), activation='relu'),
        layers.MaxPooling2D((2, 2)),
        layers.Flatten(),
        layers.Dense(2, activation='relu'),
        layers.Dense(num_classes, activation='softmax'),
    ])
    model.compile(optimizer='adam',
                  loss='categorical_crossentropy',
                  metrics=['accuracy'])
    return model

def prepare_dataset(dataset_name):
    """Load a supported dataset and prepare it for training.

    Only the tail of this function survived in this template; the header
    and the dataset-loading branches are restored from the Phase-1 version
    of the same function.

    Images are converted to float32 and divided by 255; labels are one-hot
    encoded with ``to_categorical``.

    Args:
        dataset_name: Either ``'fashion_mnist'`` or ``'cifar10'``.

    Returns:
        ``((x_train, y_train), (x_test, y_test), input_shape, num_classes)``.

    Raises:
        ValueError: If ``dataset_name`` is not one of the supported names.
    """
    if dataset_name == 'fashion_mnist':
        (x_train, y_train), (x_test, y_test) = fashion_mnist.load_data()
        num_classes = 10
        input_shape = (28, 28, 1)
        # Add the explicit single-channel axis that Conv2D expects.
        x_train = x_train.reshape(-1, 28, 28, 1)
        x_test = x_test.reshape(-1, 28, 28, 1)
    elif dataset_name == 'cifar10':
        (x_train, y_train), (x_test, y_test) = cifar10.load_data()
        num_classes = 10
        input_shape = (32, 32, 3)
    else:
        raise ValueError(f"Unsupported dataset: {dataset_name}")

    x_train = x_train.astype('float32') / 255
    x_test = x_test.astype('float32') / 255
    y_train = to_categorical(y_train, num_classes)
    y_test = to_categorical(y_test, num_classes)

    return (x_train, y_train), (x_test, y_test), input_shape, num_classes

def evaluate_model(model, x_test, y_test, device):
    """Evaluate an already trained model and time the evaluation.

    Args:
        model: Compiled model exposing ``evaluate`` that returns
            ``(loss, accuracy)``.
        x_test: Test inputs.
        y_test: Test labels in the format the model was compiled for.
        device: TensorFlow device string the evaluation is placed on.

    Returns:
        ``(accuracy, eval_time)`` with ``eval_time`` in seconds.
    """
    with tf.device(device):
        start_time = time.perf_counter()
        # The loss is not reported by this helper, only the accuracy.
        _, acc = model.evaluate(x_test, y_test, verbose=0)
        eval_time = time.perf_counter() - start_time
    return acc, eval_time

def profile_workload(model, device, dev_name, image, iterations=30):
    """Measure the average single-call inference latency of ``model``.

    Ten untimed warm-up calls are made first, then ``iterations`` timed
    calls.

    Args:
        model: Callable model, invoked as ``model(image, training=False)``.
        device: TensorFlow device string the calls are placed on.
        dev_name: Human-readable device name used in the printed messages.
        image: Input passed to the model on every call.
        iterations: Number of timed calls; must be at least 1.

    Returns:
        The mean latency of the timed calls in milliseconds.

    Raises:
        ValueError: If ``iterations`` is smaller than 1.
    """
    if iterations < 1:
        # An empty sample would make the mean NaN.
        raise ValueError("iterations must be at least 1")

    print(f"Profiling on {dev_name}...")
    latencies = []
    with tf.device(device):
        # Warm-up calls are deliberately not timed.
        for _ in tqdm(range(10), desc="Warm-up"):
            model(image, training=False)

        for _ in tqdm(range(iterations), desc="Profiling"):
            start = time.perf_counter()
            model(image, training=False)
            latencies.append((time.perf_counter() - start) * 1000)

    avg_latency = np.mean(latencies)
    print(f"Average Latency on {dev_name}: {avg_latency:.2f} ms")
    return avg_latency

def profile_tflite_model(interpreter, input_tensor, iterations=30):
    """Measure the average latency of one TFLite interpreter invocation.

    Each measured step writes ``input_tensor`` into the interpreter's first
    input and calls ``invoke()``. Ten untimed warm-up steps run first.

    Args:
        interpreter: Interpreter whose tensors are already allocated; it
            must provide ``get_input_details``, ``set_tensor`` and
            ``invoke``.
        input_tensor: Value written to the first input tensor on every step.
        iterations: Number of timed steps; must be at least 1.

    Returns:
        The mean latency of the timed steps in milliseconds.

    Raises:
        ValueError: If ``iterations`` is smaller than 1.
    """
    if iterations < 1:
        # An empty sample would make the mean NaN.
        raise ValueError("iterations must be at least 1")

    input_index = interpreter.get_input_details()[0]['index']

    def run_once():
        interpreter.set_tensor(input_index, input_tensor)
        interpreter.invoke()

    # Warm-up steps are deliberately not timed.
    for _ in range(10):
        run_once()

    latencies = []
    for _ in range(iterations):
        start = time.perf_counter()
        run_once()
        latencies.append((time.perf_counter() - start) * 1000)

    return np.mean(latencies)

def quantize_model_to_int8(model, representative_data_gen,
                           save_path="model_int8.tflite"):
    """Convert a Keras model to an INT8 TFLite model and write it to disk.

    The converter is configured with the default optimizations, the INT8
    built-in op set, and int8 input and output tensors.

    Args:
        model: Keras model to convert.
        representative_data_gen: Callable assigned to the converter's
            ``representative_dataset``.
        save_path: Destination file for the converted model.
    """
    converter = tf.lite.TFLiteConverter.from_keras_model(model)
    converter.optimizations = [tf.lite.Optimize.DEFAULT]
    converter.representative_dataset = representative_data_gen
    converter.target_spec.supported_ops = [tf.lite.OpsSet.TFLITE_BUILTINS_INT8]
    converter.inference_input_type = tf.int8
    converter.inference_output_type = tf.int8

    tflite_quant_model = converter.convert()
    with open(save_path, "wb") as f:
        f.write(tflite_quant_model)

    print(f"INT8 Quantized model saved at {save_path}")

def get_file_size(file_path):
    """Return the size of the file at ``file_path`` in kibibytes.

    Args:
        file_path: Path of an existing file.

    Returns:
        The file size in bytes divided by 1024, as a float.
    """
    return os.path.getsize(file_path) / 1024  # KB

def _to_interpreter_input(real_values, input_detail):
    """Convert real-valued data to the dtype of a TFLite input tensor."""
    dtype = input_detail['dtype']
    if not np.issubdtype(dtype, np.integer):
        return real_values.astype(dtype)

    scale, zero_point = input_detail['quantization']
    if scale == 0:
        # No quantization parameters recorded: treat values as already scaled.
        scale = 1.0
    limits = np.iinfo(dtype)
    quantized = np.round(real_values / scale + zero_point)
    # Clip instead of letting the cast wrap around (e.g. 200 -> -56 for int8).
    return np.clip(quantized, limits.min, limits.max).astype(dtype)


def evaluate_tflite_accuracy(tflite_model_path, x_test, y_test):
    """Compute the accuracy of a TFLite model, one sample at a time.

    Inputs are rescaled by 255 (the same scaling this file's representative
    dataset applies before calibration) and then quantized with the scale
    and zero point reported by the interpreter. Casting the 0-255 values
    straight to int8 would overflow for every value above 127.

    Args:
        tflite_model_path: Path of the ``.tflite`` file to load.
        x_test: Test inputs; the first axis indexes samples.
        y_test: Per-sample label vectors; the arg-max of each row is taken
            as the true class.

    Returns:
        The fraction of samples whose arg-max output matches the label.

    Raises:
        ValueError: If ``x_test`` contains no samples.
    """
    total = x_test.shape[0]
    if total == 0:
        raise ValueError("x_test is empty; accuracy is undefined")

    interpreter = tf.lite.Interpreter(model_path=tflite_model_path)
    interpreter.allocate_tensors()

    input_detail = interpreter.get_input_details()[0]
    output_index = interpreter.get_output_details()[0]['index']

    inputs = _to_interpreter_input(x_test * 255, input_detail)

    correct = 0
    for i in range(total):
        interpreter.set_tensor(input_detail['index'], inputs[i:i + 1])
        interpreter.invoke()
        output = interpreter.get_tensor(output_index)
        # Arg-max is unaffected by the (monotonic) output quantization.
        if np.argmax(output) == np.argmax(y_test[i]):
            correct += 1
    return correct / total

# -------------------
# Main Code
# -------------------
# TensorFlow has no 'MPS' device type; Apple-silicon GPUs exposed through the
# tensorflow-metal plugin are listed under 'GPU', just like CUDA GPUs, so a
# single GPU check covers both.
if tf.config.list_physical_devices('GPU'):
    device = '/GPU:0'
    dev_name = 'GPU'
else:
    device = '/CPU:0'
    dev_name = 'CPU'
print(f'Using {dev_name}')

datasets = ['fashion_mnist', 'cifar10']

for dataset in datasets:
    print(f"\nProcessing {dataset}...")

    (x_train, y_train), (x_test, y_test), input_shape, num_classes = (
        prepare_dataset(dataset))

    with tf.device(device):
        model = create_base_model(input_shape, num_classes)
        early_stop = EarlyStopping(monitor='val_loss', patience=3,
                                   restore_best_weights=True)
        start_train = time.time()
        model.fit(x_train, y_train, epochs=25, batch_size=64,
                  validation_split=0.2,
                  callbacks=[early_stop], verbose=1)
        train_time = time.time() - start_train

    test_acc_fp32, eval_time_fp32 = evaluate_model(model, x_test, y_test,
                                                   device)
    num_params = model.count_params()

    test_image = tf.convert_to_tensor(x_test[:1], dtype=tf.float32)
    orig_latency = profile_workload(model, device, dev_name, test_image)

    # Save original model
    model.save('model_fp32.h5')
    fp32_size = get_file_size('model_fp32.h5')
    print(f"Original Model Size: {fp32_size:.2f} KB")

    # Quantization
    def representative_data_gen():
        # Calibrate on training samples so the test set stays unseen.
        # NOTE(review): samples are rescaled to 0-255 here although the
        # Keras model was trained on [0, 1] inputs -- confirm this is the
        # intended calibration range.
        calibration = tf.data.Dataset.from_tensor_slices(x_train)
        for input_value in calibration.batch(1).take(100):
            yield [tf.cast(input_value * 255.0, tf.float32)]

    quantize_model_to_int8(model, representative_data_gen,
                           save_path="model_int8.tflite")
    int8_size = get_file_size("model_int8.tflite")
    print(f"Quantized Model Size: {int8_size:.2f} KB")

    # Accuracy after quantization
    test_acc_int8 = evaluate_tflite_accuracy("model_int8.tflite", x_test,
                                             y_test)

    # Inference latency after quantization
    interpreter = tf.lite.Interpreter(model_path="model_int8.tflite")
    interpreter.allocate_tensors()
    input_details = interpreter.get_input_details()
    # Quantize with the tensor's own scale/zero point; casting 0-255 values
    # straight to int8 would wrap everything above 127 to negative numbers.
    scale, zero_point = input_details[0]['quantization']
    if scale == 0:
        scale = 1.0
    quantized = np.round(x_test[:1] * 255 / scale + zero_point)
    test_image_int8 = np.clip(quantized, -128, 127).astype(np.int8)
    int8_latency = profile_tflite_model(interpreter, test_image_int8)

    print("\nSummary:")
    print(f"{'Metric':<25} {'Before Quantization':<20} {'After Quantization'}")
    print(f"{'-'*70}")
    print(f"{'Number of Parameters':<25} {num_params:<20} {num_params}")
    print(f"{'Test Accuracy (%)':<25} {test_acc_fp32*100:.2f}%{'':<12} {test_acc_int8*100:.2f}%")
    print(f"{'Training Time (s)':<25} {train_time:.2f}{'':<16} {'-'}")
    print(f"{'Evaluation Time (s)':<25} {eval_time_fp32:.4f}{'':<14} {'-'}")
    print(f"{'Inference Latency (ms)':<25} {orig_latency:.2f}{'':<14} {int8_latency:.2f}")
    print(f"{'Model Size (KB)':<25} {fp32_size:.2f}{'':<14} {int8_size:.2f}")

Distributed Database Concepts
No ratings yet
Distributed Database Concepts
35 pages
Introduction To Systems Analysis and Design:: An Agile, Iterative Approach
No ratings yet
Introduction To Systems Analysis and Design:: An Agile, Iterative Approach
39 pages
Introduction To Systems Analysis and Design:: An Agile, Iterative Approach
No ratings yet
Introduction To Systems Analysis and Design:: An Agile, Iterative Approach
49 pages
HW4ML Project Code
No ratings yet
HW4ML Project Code
24 pages
Deep Learning Practical
No ratings yet
Deep Learning Practical
12 pages
Raw Nitex
No ratings yet
Raw Nitex
5 pages
CVcode
No ratings yet
CVcode
4 pages
Exp. No.: I. Aim: AIML634P Neural Network Lab 2262034
No ratings yet
Exp. No.: I. Aim: AIML634P Neural Network Lab 2262034
6 pages
This Python Script Implements A Single
No ratings yet
This Python Script Implements A Single
6 pages
Assignment 3 DS5620
No ratings yet
Assignment 3 DS5620
11 pages
Final Code
No ratings yet
Final Code
16 pages
CNN TF Keras
No ratings yet
CNN TF Keras
6 pages
Deep Learning
No ratings yet
Deep Learning
30 pages
Practical 2: Amtics Enrollment No: 202203103510493
No ratings yet
Practical 2: Amtics Enrollment No: 202203103510493
6 pages
Deep Learning
No ratings yet
Deep Learning
46 pages
DL Practical 6,7 Outputs
No ratings yet
DL Practical 6,7 Outputs
9 pages
Apex For Bres 1
No ratings yet
Apex For Bres 1
6 pages
Deep Learning Lab With Output
No ratings yet
Deep Learning Lab With Output
12 pages
Neural DEEP
No ratings yet
Neural DEEP
39 pages
Lab Manual
No ratings yet
Lab Manual
45 pages
Hand Written
No ratings yet
Hand Written
13 pages
Deep Learning Lab Manual
No ratings yet
Deep Learning Lab Manual
11 pages
MNIST Tensorflow Mini Project 1749471354
No ratings yet
MNIST Tensorflow Mini Project 1749471354
4 pages
DL 1
No ratings yet
DL 1
3 pages
DL 3 Ks
No ratings yet
DL 3 Ks
6 pages
Skill 7
No ratings yet
Skill 7
11 pages
Nndlmac
No ratings yet
Nndlmac
9 pages
CSE488 - Lab8 - TensorFlow II
No ratings yet
CSE488 - Lab8 - TensorFlow II
9 pages
DL Exps
No ratings yet
DL Exps
9 pages
VGG16 Estudo
No ratings yet
VGG16 Estudo
10 pages
Nndlrepo 2
No ratings yet
Nndlrepo 2
3 pages
Handwritten Digit Recognition Using A Neural Network
No ratings yet
Handwritten Digit Recognition Using A Neural Network
4 pages
1729492946538
No ratings yet
1729492946538
10 pages
Brain Tumour Classification
No ratings yet
Brain Tumour Classification
10 pages
Deep Learning Practical File
No ratings yet
Deep Learning Practical File
36 pages
Deep Learning Programs Updated
No ratings yet
Deep Learning Programs Updated
24 pages
Python Deep Learning Lab Programs
No ratings yet
Python Deep Learning Lab Programs
35 pages
DL Practical 3
No ratings yet
DL Practical 3
5 pages
DL Programs
No ratings yet
DL Programs
12 pages
Neural Network
No ratings yet
Neural Network
10 pages
TMA01 Question 1 (45 Marks)
No ratings yet
TMA01 Question 1 (45 Marks)
31 pages
A3 - Jupyter Notebook PDF
No ratings yet
A3 - Jupyter Notebook PDF
5 pages
NNDL Lab Record
No ratings yet
NNDL Lab Record
26 pages
Quality Testing MobileNet V2 Compressed
No ratings yet
Quality Testing MobileNet V2 Compressed
13 pages
Applied Machine and Deep Learning
No ratings yet
Applied Machine and Deep Learning
34 pages
Ass 3
No ratings yet
Ass 3
5 pages
ANN Detection Technique
No ratings yet
ANN Detection Technique
20 pages
DL Prac03IT
No ratings yet
DL Prac03IT
7 pages
(23mca24) Practical 1 & Practical 2
No ratings yet
(23mca24) Practical 1 & Practical 2
6 pages
NNDL 2
No ratings yet
NNDL 2
67 pages
Introduction To ANN With Steps 10 25
No ratings yet
Introduction To ANN With Steps 10 25
30 pages
DL Record Merged
No ratings yet
DL Record Merged
113 pages
Deep Learning Experiments
No ratings yet
Deep Learning Experiments
42 pages
Keras - Datasets Keras - Datasets: "X - Train Shape" "Y - Train Shape" "X - Test Shape" "Y - Test Shape"
No ratings yet
Keras - Datasets Keras - Datasets: "X - Train Shape" "Y - Train Shape" "X - Test Shape" "Y - Test Shape"
6 pages
DLTF Lab Manual.1
No ratings yet
DLTF Lab Manual.1
29 pages
Quality Testing Resnet18 Compressed (1)
No ratings yet
Quality Testing Resnet18 Compressed (1)
13 pages
Assignment 02# - Machine Learning 2023
No ratings yet
Assignment 02# - Machine Learning 2023
8 pages
DL LAB MANUAL Mugesh
No ratings yet
DL LAB MANUAL Mugesh
12 pages
BLDD VIT ResNet50v2 CustomCNN
No ratings yet
BLDD VIT ResNet50v2 CustomCNN
38 pages
Introduction To Genetic Algorithm Neural Networks
No ratings yet
Introduction To Genetic Algorithm Neural Networks
44 pages
Assignment3 AL
No ratings yet
Assignment3 AL
23 pages
Profound Python Data Science
From Everand
Profound Python Data Science
Onder Teker
No ratings yet
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet
Lab 6
No ratings yet
Lab 6
29 pages
Ece265p Fahmy Day7
No ratings yet
Ece265p Fahmy Day7
93 pages
Chapter 12
No ratings yet
Chapter 12
61 pages
Chapter19 v2
No ratings yet
Chapter19 v2
54 pages
XML: Extensible Markup Language
No ratings yet
XML: Extensible Markup Language
35 pages
The Role of Multichannel Integration in CRM: Adrian Payne and Pennie Frow
No ratings yet
The Role of Multichannel Integration in CRM: Adrian Payne and Pennie Frow
9 pages
? Best AI Tools For SEO
No ratings yet
? Best AI Tools For SEO
4 pages
Fracktal Works - Application Engineer
No ratings yet
Fracktal Works - Application Engineer
2 pages
Communication Systems: Fourier Analysis
No ratings yet
Communication Systems: Fourier Analysis
11 pages
Micro Python
No ratings yet
Micro Python
21 pages
MSC It Thesis Topics
100% (3)
MSC It Thesis Topics
7 pages
Soumya Mukherjee 1219567
No ratings yet
Soumya Mukherjee 1219567
3 pages
Math644 - Chapter 1 - Part2 PDF
No ratings yet
Math644 - Chapter 1 - Part2 PDF
14 pages
2023-Def - Scriptie SerkanenKaplanoglu PatrickChu
No ratings yet
2023-Def - Scriptie SerkanenKaplanoglu PatrickChu
93 pages
Practical 19
No ratings yet
Practical 19
4 pages
Dynamic Analysis Program Development For A Wiper Linkage: W. H. Kim, T. W. Park, S. P. Jung and J. H. Lee, W. S. Chung
No ratings yet
Dynamic Analysis Program Development For A Wiper Linkage: W. H. Kim, T. W. Park, S. P. Jung and J. H. Lee, W. S. Chung
3 pages
Sodapdf
No ratings yet
Sodapdf
16 pages
Introduction To Matlab: Ross L. Spencer and Michael Ware
No ratings yet
Introduction To Matlab: Ross L. Spencer and Michael Ware
111 pages
Assignment Crypto Currency
No ratings yet
Assignment Crypto Currency
8 pages
Server Iron
No ratings yet
Server Iron
330 pages
How DHCP Works and DHCP Interview Questions and Answers
No ratings yet
How DHCP Works and DHCP Interview Questions and Answers
6 pages
What's The Difference?: Coordinate Systems
No ratings yet
What's The Difference?: Coordinate Systems
2 pages
Screenshot 2024-09-06 at 4.12.05 PM
No ratings yet
Screenshot 2024-09-06 at 4.12.05 PM
14 pages
012TEU-13188A2G - 12 Brins OM3 Armature en Mèches de Verre
No ratings yet
012TEU-13188A2G - 12 Brins OM3 Armature en Mèches de Verre
4 pages
MXK 319 819 823 PDF
No ratings yet
MXK 319 819 823 PDF
7 pages
Kashmore Shafiq Soomro CV Computer Programmer Operator Manager
100% (2)
Kashmore Shafiq Soomro CV Computer Programmer Operator Manager
1 page
Asia-Myanmar-HIKVISION-Turbo HD Products-D0T-SDP - 0501
No ratings yet
Asia-Myanmar-HIKVISION-Turbo HD Products-D0T-SDP - 0501
1 page
CCASBCM211
No ratings yet
CCASBCM211
56 pages
Power Off Reset Reason Backup
No ratings yet
Power Off Reset Reason Backup
5 pages
Movie Recommendation System-1
No ratings yet
Movie Recommendation System-1
25 pages
E Z Kriging
100% (3)
E Z Kriging
58 pages
MIcro End-Milling I - Wear and Breakage
No ratings yet
MIcro End-Milling I - Wear and Breakage
18 pages
Price Tag MERC
No ratings yet
Price Tag MERC
9 pages
The Clockwork Universein Chaos
No ratings yet
The Clockwork Universein Chaos
17 pages
Debug Dump 2
No ratings yet
Debug Dump 2
286 pages
S Cubed Datasheet
No ratings yet
S Cubed Datasheet
2 pages

HW4ML Project Starter Code Template

Uploaded by

HW4ML Project Starter Code Template

Uploaded by

Accuracy, Parameters Count, Training Time (s), Inference Latency (ms).

Accuracy/Parameters Count, Accuracy/Training Time

Writing a bonus paragraph about pruning % and compression impact?

def create_base_model(input_shape, num_classes):

x_train = x_train.astype('float32') / 255

return (x_train, y_train), (x_test, y_test), input_shape, num_classes

def evaluate_model(dataset_name, max_epoch, device):

num_param = model.count_params() # counting number of model's

print(f"{dataset_name.upper()} Test Accuracy: {test_accuracy * 100:.2f}

return model, num_param, x_test, test_accuracy, train_time, eval_time

def profile_workload(model, device, dev_name, image, iterations=30):

prediction = model(image, training=False)

# Device priority: CUDA > MPS > CPU

Phase-3 code starter template

assert tf.__version__=='2.15.0', 'WARNING!!! different TensorFlow version may

def create_base_model(input_shape, num_classes):

x_train = x_train.astype('float32') / 255

return (x_train, y_train), (x_test, y_test), input_shape, num_classes

def evaluate_model(model, x_test, y_test, device):

def profile_workload(model, device, dev_name, image, iterations=30):

def profile_tflite_model(interpreter, input_tensor, iterations=30):

def quantize_model_to_int8(model, representative_data_gen,

print(f"INT8 Quantized model saved at {save_path}")

def evaluate_tflite_accuracy(tflite_model_path, x_test, y_test):

datasets = ['fashion_mnist', 'cifar10']

for dataset in datasets:

(x_train, y_train), (x_test, y_test), input_shape, num_classes =

early_stop = EarlyStopping(monitor='val_loss', patience=3,

test_acc_fp32, eval_time_fp32 = evaluate_model(model, x_test, y_test,

test_image = tf.convert_to_tensor(x_test[:1], dtype=tf.float32)

# Save original model

# Accuracy after quantization

# Inference latency after quantization

You might also like

assert tf.version=='2.15.0', 'WARNING!!! different TensorFlow version may