0% found this document useful (0 votes)

8 views6 pages

HW4ML Project Starter Code Template

The document provides code templates for evaluating and profiling machine learning models using TensorFlow, specifically for the Fashion MNIST and CIFAR-10 datasets. It includes functions for model creation, dataset preparation, evaluation, and quantization to INT8 format, along with profiling for inference latency. Additionally, it emphasizes the importance of ensuring code correctness and discusses the impact of model pruning and compression on performance metrics.

Uploaded by

Amal

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

8 views6 pages

HW4ML Project Starter Code Template

Uploaded by

Amal

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

You are on page 1/ 6

Accuracy, Parameters Count, Training Time (s), Inference Latency (ms).

Accuracy/Parameters Count, Accuracy/Training Time

Writing a bonus paragraph about pruning % and compression impact?

Phase-1 code starter template

The code below is provided for your reference; feel free to change it partially
or fully.

Please make sure it does not have any bugs or mistakes. Code authors DO NOT claim
the code is bug-free. It is the student's responsibility to ensure its correctness.

import os
import platform
import time

import numpy as np
import tensorflow as tf
from tensorflow.keras import layers, models
from tensorflow.keras.callbacks import EarlyStopping
from tensorflow.keras.datasets import fashion_mnist, cifar10
from tensorflow.keras.utils import to_categorical
from tqdm import tqdm

def create_base_model(input_shape, num_classes):
    """Build and compile the Phase-1 baseline CNN.

    The network is a single 3x3 convolution (16 filters, ReLU) followed by
    2x2 max-pooling, a flatten, a 2-unit ReLU dense layer and a softmax
    output with ``num_classes`` units.

    Args:
        input_shape: Shape of one input sample, passed to the first layer.
        num_classes: Number of units in the softmax output layer.

    Returns:
        The model, compiled with the Adam optimizer, categorical
        cross-entropy loss and the accuracy metric.
    """
    feature_layers = [
        layers.Conv2D(16, (3, 3), activation='relu', input_shape=input_shape),
        layers.MaxPooling2D((2, 2)),
        layers.Flatten(),
    ]
    classifier_layers = [
        layers.Dense(2, activation='relu'),
        layers.Dense(num_classes, activation='softmax'),
    ]

    network = models.Sequential(feature_layers + classifier_layers)
    network.compile(
        optimizer='adam',
        loss='categorical_crossentropy',
        metrics=['accuracy'],
    )
    return network

def prepare_dataset(dataset_name):
    """Load a supported dataset and prepare it for training.

    Images are converted to float32 and divided by 255; labels are one-hot
    encoded with ``to_categorical``.

    Args:
        dataset_name: Either ``'fashion_mnist'`` or ``'cifar10'``.

    Returns:
        ``((x_train, y_train), (x_test, y_test), input_shape, num_classes)``.

    Raises:
        ValueError: If ``dataset_name`` is not one of the supported names.
    """
    # Per-dataset loader and the per-sample shape the model expects.
    supported = {
        'fashion_mnist': (fashion_mnist.load_data, (28, 28, 1)),
        'cifar10': (cifar10.load_data, (32, 32, 3)),
    }
    if dataset_name not in supported:
        raise ValueError(f"Unsupported dataset: {dataset_name}")

    load_data, input_shape = supported[dataset_name]
    num_classes = 10
    (x_train, y_train), (x_test, y_test) = load_data()

    # Adds the explicit channel axis for Fashion-MNIST; for CIFAR-10 the
    # arrays already have this shape, so the reshape leaves them unchanged.
    batch_shape = (-1,) + input_shape
    x_train = x_train.reshape(batch_shape).astype('float32') / 255
    x_test = x_test.reshape(batch_shape).astype('float32') / 255

    y_train = to_categorical(y_train, num_classes)
    y_test = to_categorical(y_test, num_classes)

    return (x_train, y_train), (x_test, y_test), input_shape, num_classes

def evaluate_model(dataset_name, max_epoch, device):
    """Train the baseline model on a dataset and measure it on the test set.

    Training uses batch size 64, a 20% validation split and early stopping
    on ``val_loss`` (patience 3, best weights restored).

    Args:
        dataset_name: Dataset identifier accepted by ``prepare_dataset``.
        max_epoch: Upper bound on the number of training epochs.
        device: TensorFlow device string used for training and evaluation.

    Returns:
        ``(model, num_param, x_test, test_accuracy, train_time, eval_time)``
        where the two times are wall-clock seconds.
    """
    # Parenthesised so the long unpacking can span lines; the wrapped source
    # left a dangling '=' here, which is a syntax error.
    (x_train, y_train), (x_test, y_test), input_shape, num_classes = (
        prepare_dataset(dataset_name)
    )

    with tf.device(device):
        model = create_base_model(input_shape, num_classes)
        early_stop = EarlyStopping(monitor='val_loss', patience=3,
                                   restore_best_weights=True)

        start_time = time.time()
        model.fit(x_train, y_train, epochs=max_epoch, batch_size=64,
                  validation_split=0.2,
                  callbacks=[early_stop], verbose=1)
        train_time = time.time() - start_time

        start_time = time.time()
        test_loss, test_accuracy = model.evaluate(x_test, y_test, verbose=0)
        eval_time = time.time() - start_time

    # Counting number of model's parameters.
    num_param = model.count_params()

    # The format string was split across lines by the wrap; rejoined at the
    # space where the break occurred.
    print(f"{dataset_name.upper()} Test Accuracy: {test_accuracy * 100:.2f} %")
    print(f"{dataset_name.upper()} Number of Parameters: {num_param}")

    return model, num_param, x_test, test_accuracy, train_time, eval_time

def profile_workload(model, device, dev_name, image, iterations=30):
    """Measure the average single-call inference latency of ``model``.

    Runs 10 untimed warm-up calls, then ``iterations`` timed calls of
    ``model(image, training=False)`` under ``tf.device(device)``. Afterwards
    it runs one more prediction and prints the arg-max class of the first
    sample.

    Args:
        model: Callable Keras model.
        device: TensorFlow device string for the profiling scope.
        dev_name: Human-readable device label used in printed messages.
        image: Input batch passed to the model on every call.
        iterations: Number of timed calls.

    Returns:
        Mean latency of the timed calls in milliseconds.
    """
    print(f"Profiling on {dev_name}...")
    latencies = []
    with tf.device(device):
        # Warm-up calls are not timed, so no timestamp is taken here.
        for _ in tqdm(range(10), desc="Warm-up..."):
            _ = model(image, training=False)
        for _ in tqdm(range(iterations), desc="Profiling"):
            # perf_counter is monotonic and high-resolution, which suits
            # millisecond-scale intervals better than wall-clock time.time().
            start = time.perf_counter()
            _ = model(image, training=False)
            latencies.append((time.perf_counter() - start) * 1000)

    avg_latency = np.mean(latencies)
    print(f"Average Latency on {dev_name}: {avg_latency:.2f} ms")

    prediction = model(image, training=False)
    predicted_class = tf.argmax(prediction, axis=1).numpy()[0]
    print(f"Predicted Class: {predicted_class}")
    return avg_latency

# Device priority: GPU (CUDA, or Apple Metal via the tensorflow-metal plugin) > CPU
#
# TensorFlow has no 'MPS' physical device type: Apple GPUs are exposed by the
# Metal plugin under the 'GPU' type, so a separate 'MPS' query never matches.
# The Apple label is therefore chosen from the host platform instead.
if tf.config.list_physical_devices('GPU'):
    device = '/GPU:0'
    dev_name = 'Apple MPS' if platform.system() == 'Darwin' else 'GPU'
else:
    device = '/CPU:0'
    dev_name = 'CPU'
print(f'using {dev_name}')

datasets = ['fashion_mnist', 'cifar10']
for dataset in datasets:
    print(f"\nProcessing {dataset}...")
    # Train and evaluate, then profile single-image inference latency.
    model, num_param, x_test, acc, train_t, eval_t = evaluate_model(
        dataset, max_epoch=25, device=device)
    test_image = tf.convert_to_tensor(x_test[:1], dtype=tf.float32)
    profile_workload(model, device, dev_name, test_image)

Phase-3 code starter template

The code below is provided for your reference; feel free to change it partially
or fully.

Please make sure it does not have any bugs or mistakes. Code authors DO NOT claim
the code is bug-free. It is the student's responsibility to ensure its correctness.

# `tf.version` is a module, so comparing it to a string is always False and
# the assertion could never pass; the version string is `tf.__version__`.
assert tf.__version__ == '2.15.0', (
    'WARNING!!! different TensorFlow version may '
    'produce an error while quantizing.'
)

def create_base_model(input_shape, num_classes):
    """Build and compile the Phase-3 CNN (three conv/pool stages).

    Each stage is a 3x3 convolution with 16 filters and ReLU followed by
    2x2 max-pooling. The stages feed a flatten, a 2-unit ReLU dense layer
    and a softmax output with ``num_classes`` units.

    Args:
        input_shape: Shape of one input sample, given to the first layer.
        num_classes: Number of units in the softmax output layer.

    Returns:
        The model, compiled with the Adam optimizer, categorical
        cross-entropy loss and the accuracy metric.
    """
    model = models.Sequential([
        # Only the first layer declares the input shape; later layers infer
        # theirs from the preceding layer's output, so the copy-pasted
        # `input_shape=` arguments on them were dropped.
        layers.Conv2D(16, (3, 3), activation='relu', input_shape=input_shape),
        layers.MaxPooling2D((2, 2)),
        layers.Conv2D(16, (3, 3), activation='relu'),
        layers.MaxPooling2D((2, 2)),
        layers.Conv2D(16, (3, 3), activation='relu'),
        layers.MaxPooling2D((2, 2)),
        layers.Flatten(),
        layers.Dense(2, activation='relu'),
        layers.Dense(num_classes, activation='softmax'),
    ])
    model.compile(optimizer='adam',
                  loss='categorical_crossentropy',
                  metrics=['accuracy'])
    return model

x_train = x_train.astype('float32') / 255

x_test = x_test.astype('float32') / 255
y_train = to_categorical(y_train, num_classes)
y_test = to_categorical(y_test, num_classes)

return (x_train, y_train), (x_test, y_test), input_shape, num_classes

def evaluate_model(model, x_test, y_test, device):
    """Evaluate an already-trained model and time the evaluation.

    Args:
        model: Compiled Keras model whose ``evaluate`` returns loss and
            accuracy.
        x_test: Test inputs.
        y_test: Test labels.
        device: TensorFlow device string for the evaluation scope.

    Returns:
        ``(accuracy, eval_time)`` with ``eval_time`` in wall-clock seconds.
    """
    with tf.device(device):
        began = time.time()
        metrics = model.evaluate(x_test, y_test, verbose=0)
        elapsed = time.time() - began

    # evaluate() yields (loss, accuracy); only the accuracy is reported.
    _, accuracy = metrics
    return accuracy, elapsed

def profile_workload(model, device, dev_name, image, iterations=30):
    """Measure the average single-call inference latency of ``model``.

    Runs 10 untimed warm-up calls, then ``iterations`` timed calls of
    ``model(image, training=False)`` under ``tf.device(device)``.

    Args:
        model: Callable Keras model.
        device: TensorFlow device string for the profiling scope.
        dev_name: Human-readable device label used in printed messages.
        image: Input batch passed to the model on every call.
        iterations: Number of timed calls.

    Returns:
        Mean latency of the timed calls in milliseconds.
    """
    print(f"Profiling on {dev_name}...")
    latencies = []
    with tf.device(device):
        for _ in tqdm(range(10), desc="Warm-up"):
            _ = model(image, training=False)
        for _ in tqdm(range(iterations), desc="Profiling"):
            # perf_counter is monotonic and high-resolution, which suits
            # millisecond-scale intervals better than wall-clock time.time().
            start = time.perf_counter()
            _ = model(image, training=False)
            latencies.append((time.perf_counter() - start) * 1000)

    avg_latency = np.mean(latencies)
    print(f"Average Latency on {dev_name}: {avg_latency:.2f} ms")
    return avg_latency

def profile_tflite_model(interpreter, input_tensor, iterations=30):
    """Measure the average latency of a TFLite interpreter invocation.

    Performs 10 untimed warm-up runs, then ``iterations`` timed runs. Each
    run sets the first input tensor and calls ``invoke()``; both steps are
    inside the timed region.

    Args:
        interpreter: Interpreter exposing ``get_input_details``,
            ``set_tensor`` and ``invoke`` (tensors already allocated).
        input_tensor: Value written to the first input on every run.
        iterations: Number of timed runs.

    Returns:
        Mean latency of the timed runs in milliseconds.
    """
    # Looked up once so the dictionary access is not part of the timed region.
    input_index = interpreter.get_input_details()[0]['index']

    for _ in range(10):
        interpreter.set_tensor(input_index, input_tensor)
        interpreter.invoke()

    latencies = []
    for _ in range(iterations):
        # perf_counter is monotonic and high-resolution, which suits
        # millisecond-scale intervals better than wall-clock time.time().
        start = time.perf_counter()
        interpreter.set_tensor(input_index, input_tensor)
        interpreter.invoke()
        latencies.append((time.perf_counter() - start) * 1000)

    avg_latency = np.mean(latencies)
    return avg_latency

def quantize_model_to_int8(model, representative_data_gen,
                           save_path="model_int8.tflite"):
    """Convert a Keras model to an INT8 TFLite model and write it to disk.

    The converter is configured with default optimizations, the INT8
    built-in op set, int8 input and output types, and the given
    representative dataset generator.

    Args:
        model: Keras model to convert.
        representative_data_gen: Callable assigned to the converter's
            ``representative_dataset``.
        save_path: Destination file for the serialized TFLite model.
    """
    int8_converter = tf.lite.TFLiteConverter.from_keras_model(model)

    # Integer-only conversion settings.
    int8_converter.optimizations = [tf.lite.Optimize.DEFAULT]
    int8_converter.target_spec.supported_ops = [
        tf.lite.OpsSet.TFLITE_BUILTINS_INT8
    ]
    int8_converter.representative_dataset = representative_data_gen

    # Both the input and the output of the converted model are int8.
    int8_converter.inference_input_type = tf.int8
    int8_converter.inference_output_type = tf.int8

    # Convert before opening the file so a failed conversion leaves no file.
    serialized_model = int8_converter.convert()
    with open(save_path, "wb") as out_file:
        out_file.write(serialized_model)

    print(f"INT8 Quantized model saved at {save_path}")

def get_file_size(file_path):
    """Return the size of the file at ``file_path`` in kibibytes.

    Args:
        file_path: Path of an existing file.

    Returns:
        The size in bytes divided by 1024, as a float.

    Raises:
        OSError: Propagated from ``os.path.getsize`` when the file does not
            exist or is inaccessible.
    """
    return os.path.getsize(file_path) / 1024  # KB

def evaluate_tflite_accuracy(tflite_model_path, x_test, y_test):
    """Compute top-1 accuracy of a TFLite model, one sample at a time.

    Each float sample is quantized with the scale and zero-point that the
    model reports for its first input, then clipped to that input's integer
    range. The previous ``np.round(x * 255).astype(np.int8)`` wrapped every
    value above 127 to a negative number and ignored the model's own
    quantization parameters.

    Args:
        tflite_model_path: Path to the ``.tflite`` file.
        x_test: Float test inputs, in the same value range the original
            Keras model was evaluated on.
        y_test: One-hot test labels, indexed like ``x_test``.

    Returns:
        Fraction of samples whose arg-max output equals the arg-max label.
    """
    interpreter = tf.lite.Interpreter(model_path=tflite_model_path)
    interpreter.allocate_tensors()

    input_info = interpreter.get_input_details()[0]
    output_index = interpreter.get_output_details()[0]['index']

    input_index = input_info['index']
    input_dtype = input_info['dtype']
    scale, zero_point = input_info['quantization']

    correct = 0
    total = x_test.shape[0]
    for i in range(total):
        sample = x_test[i:i + 1]
        if scale:
            # real = scale * (q - zero_point), so q = real / scale + zero_point.
            limits = np.iinfo(input_dtype)
            sample = np.clip(np.round(sample / scale + zero_point),
                             limits.min, limits.max)
        # A zero scale means the input is not quantized; feed it unchanged.
        input_data = sample.astype(input_dtype)

        interpreter.set_tensor(input_index, input_data)
        interpreter.invoke()
        output = interpreter.get_tensor(output_index)
        # NOTE(review): arg-max is taken on the raw output, as before; this
        # matches the dequantized arg-max as long as the output scale is
        # positive - confirm against the converted model.
        if np.argmax(output) == np.argmax(y_test[i]):
            correct += 1

    accuracy = correct / total
    return accuracy

# -------------------
# Main Code
# -------------------
# TensorFlow has no 'MPS' physical device type: Apple GPUs are exposed by the
# Metal plugin under the 'GPU' type, so a separate 'MPS' query never matches.
# The Apple label is therefore chosen from the host platform instead.
if tf.config.list_physical_devices('GPU'):
    device = '/GPU:0'
    dev_name = 'Apple MPS' if platform.system() == 'Darwin' else 'GPU'
else:
    device = '/CPU:0'
    dev_name = 'CPU'
print(f'Using {dev_name}')

datasets = ['fashion_mnist', 'cifar10']

for dataset in datasets:
    print(f"\nProcessing {dataset}...")

    (x_train, y_train), (x_test, y_test), input_shape, num_classes = (
        prepare_dataset(dataset)
    )

    with tf.device(device):
        model = create_base_model(input_shape, num_classes)
        early_stop = EarlyStopping(monitor='val_loss', patience=3,
                                   restore_best_weights=True)
        start_train = time.time()
        model.fit(x_train, y_train, epochs=25, batch_size=64,
                  validation_split=0.2,
                  callbacks=[early_stop], verbose=1)
        train_time = time.time() - start_train

    test_acc_fp32, eval_time_fp32 = evaluate_model(model, x_test, y_test,
                                                   device)
    num_params = model.count_params()

    test_image = tf.convert_to_tensor(x_test[:1], dtype=tf.float32)
    orig_latency = profile_workload(model, device, dev_name, test_image)

    # Save original model
    model.save('model_fp32.h5')
    fp32_size = get_file_size('model_fp32.h5')
    print(f"Original Model Size: {fp32_size:.2f} KB")

    # Quantization
    def representative_data_gen():
        # Calibration samples must look like the data the model was trained
        # on: [0, 1]-scaled floats, not values multiplied back up by 255.
        # They come from the training set so the test set stays unseen.
        calibration = tf.data.Dataset.from_tensor_slices(x_train)
        for input_value in calibration.batch(1).take(100):
            yield [tf.cast(input_value, tf.float32)]

    quantize_model_to_int8(model, representative_data_gen,
                           save_path="model_int8.tflite")
    int8_size = get_file_size("model_int8.tflite")
    print(f"Quantized Model Size: {int8_size:.2f} KB")

    # Accuracy after quantization
    test_acc_int8 = evaluate_tflite_accuracy("model_int8.tflite", x_test,
                                             y_test)

    # Inference latency after quantization
    interpreter = tf.lite.Interpreter(model_path="model_int8.tflite")
    interpreter.allocate_tensors()
    input_details = interpreter.get_input_details()
    # Quantize the sample with the model's own input scale and zero-point;
    # casting 0..255 straight to int8 would overflow for values above 127.
    in_scale, in_zero_point = input_details[0]['quantization']
    in_dtype = input_details[0]['dtype']
    in_limits = np.iinfo(in_dtype)
    test_image_int8 = np.clip(
        np.round(x_test[:1] / in_scale + in_zero_point),
        in_limits.min, in_limits.max,
    ).astype(in_dtype)
    int8_latency = profile_tflite_model(interpreter, test_image_int8)

    print("\nSummary:")
    print(f"{'Metric':<25} {'Before Quantization':<20} {'After Quantization'}")
    print(f"{'-'*70}")
    print(f"{'Number of Parameters':<25} {num_params:<20} {num_params}")
    print(f"{'Test Accuracy (%)':<25} {test_acc_fp32*100:.2f}%{'':<12} {test_acc_int8*100:.2f}%")
    print(f"{'Training Time (s)':<25} {train_time:.2f}{'':<16} {'-'}")
    print(f"{'Evaluation Time (s)':<25} {eval_time_fp32:.4f}{'':<14} {'-'}")
    print(f"{'Inference Latency (ms)':<25} {orig_latency:.2f}{'':<14} {int8_latency:.2f}")
    print(f"{'Model Size (KB)':<25} {fp32_size:.2f}{'':<14} {int8_size:.2f}")

DLV Lab Manual Print
No ratings yet
DLV Lab Manual Print
29 pages
Deep Learning Practical File
No ratings yet
Deep Learning Practical File
36 pages
IJCSDF 7 4 Forensic Investigation Whatsapp
100% (1)
IJCSDF 7 4 Forensic Investigation Whatsapp
11 pages
HW4ML Project Code
No ratings yet
HW4ML Project Code
24 pages
Assignment 02# - Machine Learning 2023
No ratings yet
Assignment 02# - Machine Learning 2023
8 pages
Apex For Bres 1
No ratings yet
Apex For Bres 1
6 pages
Keras - Datasets Keras - Datasets: "X - Train Shape" "Y - Train Shape" "X - Test Shape" "Y - Test Shape"
No ratings yet
Keras - Datasets Keras - Datasets: "X - Train Shape" "Y - Train Shape" "X - Test Shape" "Y - Test Shape"
6 pages
DL 3 Ks
No ratings yet
DL 3 Ks
6 pages
Neural Network
No ratings yet
Neural Network
10 pages
Raw Nitex
No ratings yet
Raw Nitex
5 pages
A3 - Jupyter Notebook PDF
No ratings yet
A3 - Jupyter Notebook PDF
5 pages
Hand Written
No ratings yet
Hand Written
13 pages
TMA01 Question 1 (45 Marks)
No ratings yet
TMA01 Question 1 (45 Marks)
31 pages
01 249212 012 10129792044 11122022 112910pm
No ratings yet
01 249212 012 10129792044 11122022 112910pm
8 pages
ANN Detection Technique
No ratings yet
ANN Detection Technique
20 pages
CNN TF Keras
No ratings yet
CNN TF Keras
6 pages
DL Practical 6,7 Outputs
No ratings yet
DL Practical 6,7 Outputs
9 pages
(23mca24) Practical 1 & Practical 2
No ratings yet
(23mca24) Practical 1 & Practical 2
6 pages
CSE488 - Lab8 - TensorFlow II
No ratings yet
CSE488 - Lab8 - TensorFlow II
9 pages
Deep Learning Lab With Output
No ratings yet
Deep Learning Lab With Output
12 pages
Final Code
No ratings yet
Final Code
16 pages
DL Prac03IT
No ratings yet
DL Prac03IT
7 pages
Numerical Methods in Quantum Mechanics PDF
100% (1)
Numerical Methods in Quantum Mechanics PDF
101 pages
Klaas Dellschaft Dissertation
100% (2)
Klaas Dellschaft Dissertation
8 pages
Deep Learning Lab Manual
No ratings yet
Deep Learning Lab Manual
11 pages
BLDD VIT ResNet50v2 CustomCNN
No ratings yet
BLDD VIT ResNet50v2 CustomCNN
38 pages
Handwritten Digit Recognition Using A Neural Network
No ratings yet
Handwritten Digit Recognition Using A Neural Network
4 pages
VGG16 Estudo
No ratings yet
VGG16 Estudo
10 pages
CVcode
No ratings yet
CVcode
4 pages
Ass 3
No ratings yet
Ass 3
5 pages
DL Practical 3
No ratings yet
DL Practical 3
5 pages
DL Exps
No ratings yet
DL Exps
9 pages
Lab Manual
No ratings yet
Lab Manual
45 pages
Practical 2: Amtics Enrollment No: 202203103510493
No ratings yet
Practical 2: Amtics Enrollment No: 202203103510493
6 pages
MNIST Tensorflow Mini Project 1749471354
No ratings yet
MNIST Tensorflow Mini Project 1749471354
4 pages
Applied Machine and Deep Learning
No ratings yet
Applied Machine and Deep Learning
34 pages
NNDL 2
No ratings yet
NNDL 2
67 pages
Assignment 3 DS5620
No ratings yet
Assignment 3 DS5620
11 pages
Deep Learning
No ratings yet
Deep Learning
30 pages
Deep Learning Practical
No ratings yet
Deep Learning Practical
12 pages
DL Programs
No ratings yet
DL Programs
12 pages
Nndlrepo 2
No ratings yet
Nndlrepo 2
3 pages
Skill 7
No ratings yet
Skill 7
11 pages
Exp. No.: I. Aim: AIML634P Neural Network Lab 2262034
No ratings yet
Exp. No.: I. Aim: AIML634P Neural Network Lab 2262034
6 pages
DL Record Merged
No ratings yet
DL Record Merged
113 pages
Introduction To ANN With Steps 10 25
No ratings yet
Introduction To ANN With Steps 10 25
30 pages
Introduction To Systems Analysis and Design:: An Agile, Iterative Approach
No ratings yet
Introduction To Systems Analysis and Design:: An Agile, Iterative Approach
39 pages
Assignment3 AL
No ratings yet
Assignment3 AL
23 pages
1729492946538
No ratings yet
1729492946538
10 pages
This Python Script Implements A Single
No ratings yet
This Python Script Implements A Single
6 pages
Nndlmac
No ratings yet
Nndlmac
9 pages
Introduction To Genetic Algorithm Neural Networks
No ratings yet
Introduction To Genetic Algorithm Neural Networks
44 pages
DLTF Lab Manual.1
No ratings yet
DLTF Lab Manual.1
29 pages
DL LAB MANUAL Mugesh
No ratings yet
DL LAB MANUAL Mugesh
12 pages
Deep Learning
No ratings yet
Deep Learning
46 pages
Python Deep Learning Lab Programs
No ratings yet
Python Deep Learning Lab Programs
35 pages
Pioneer+Deh p5780mp
No ratings yet
Pioneer+Deh p5780mp
82 pages
Deep Learning Experiments
No ratings yet
Deep Learning Experiments
42 pages
Brain Tumour Classification
No ratings yet
Brain Tumour Classification
10 pages
Deep Learning Lab With Tensorflow
No ratings yet
Deep Learning Lab With Tensorflow
84 pages
12mahmoud El Saeed Sakr CV2
No ratings yet
12mahmoud El Saeed Sakr CV2
2 pages
Neural DEEP
No ratings yet
Neural DEEP
39 pages
The Role of Multichannel Integration in CRM: Adrian Payne and Pennie Frow
No ratings yet
The Role of Multichannel Integration in CRM: Adrian Payne and Pennie Frow
9 pages
Deep Learning Programs Updated
No ratings yet
Deep Learning Programs Updated
24 pages
Fg2c Fg3c Manual
No ratings yet
Fg2c Fg3c Manual
44 pages
GNUSim8085 Assembly Language Guide
100% (1)
GNUSim8085 Assembly Language Guide
3 pages
Data Mining and Warehousing
No ratings yet
Data Mining and Warehousing
18 pages
EMS Cert Qs
No ratings yet
EMS Cert Qs
22 pages
Introduction To Systems Analysis and Design:: An Agile, Iterative Approach
No ratings yet
Introduction To Systems Analysis and Design:: An Agile, Iterative Approach
49 pages
NNDL Lab Record
No ratings yet
NNDL Lab Record
26 pages
Chapter 12
No ratings yet
Chapter 12
61 pages
Chapter19 v2
No ratings yet
Chapter19 v2
54 pages
XML: Extensible Markup Language
No ratings yet
XML: Extensible Markup Language
35 pages
Sony Blu-Ray Player BDP-S190 PDF
No ratings yet
Sony Blu-Ray Player BDP-S190 PDF
32 pages
Machine Learning Approaches For Soil Type Classification in
No ratings yet
Machine Learning Approaches For Soil Type Classification in
20 pages
JVM Overview Content
No ratings yet
JVM Overview Content
10 pages
Attention-Based CRNN Models For Identification of Respiratory Diseases From Lung Sounds
No ratings yet
Attention-Based CRNN Models For Identification of Respiratory Diseases From Lung Sounds
7 pages
Fire Exit Plan
No ratings yet
Fire Exit Plan
5 pages
IASSim A Programmable Emulator For The Princeton I
No ratings yet
IASSim A Programmable Emulator For The Princeton I
7 pages
Gmail - London Met - Conditional Offer 24019555 - Global Human Resource Management - (GSBL)
No ratings yet
Gmail - London Met - Conditional Offer 24019555 - Global Human Resource Management - (GSBL)
5 pages
CIMATRON Sketcher
No ratings yet
CIMATRON Sketcher
71 pages
Distributed Database Concepts
No ratings yet
Distributed Database Concepts
35 pages
Ece265p Fahmy Day7
No ratings yet
Ece265p Fahmy Day7
93 pages
LS2208 Spec Sheet
No ratings yet
LS2208 Spec Sheet
2 pages
DE THI HK 2-LOP 10-20232024 - 570 - Dap An
No ratings yet
DE THI HK 2-LOP 10-20232024 - 570 - Dap An
4 pages
Google Classroom Codes
No ratings yet
Google Classroom Codes
1 page
Computer Integrated Manufacturing - Assignment 1
No ratings yet
Computer Integrated Manufacturing - Assignment 1
3 pages
Advanced Phrasal Verb Challenge Day 10 Exercise
No ratings yet
Advanced Phrasal Verb Challenge Day 10 Exercise
3 pages
Lab 6
No ratings yet
Lab 6
29 pages
Verisure Fast-Ii: Product Specifications
No ratings yet
Verisure Fast-Ii: Product Specifications
1 page
HP Jet Fusion 5200, 5210, 5210 Pro 3D Printing Solution - Certificate of Origin
No ratings yet
HP Jet Fusion 5200, 5210, 5210 Pro 3D Printing Solution - Certificate of Origin
1 page
IP 31 Series Online UPS: Technical Specifications
100% (1)
IP 31 Series Online UPS: Technical Specifications
1 page
Dec - 2022 BCS-053
No ratings yet
Dec - 2022 BCS-053
4 pages
Indicative Specification For Mobile X-Ray Unit
No ratings yet
Indicative Specification For Mobile X-Ray Unit
14 pages
The Three-Wire Quarter-Bridge Circuit
No ratings yet
The Three-Wire Quarter-Bridge Circuit
4 pages
Kovács György - Bakosi Éva - Játék Az Óvódában
100% (3)
Kovács György - Bakosi Éva - Játék Az Óvódában
239 pages
Comp 1 Reviewer
No ratings yet
Comp 1 Reviewer
5 pages
Profound Python Data Science
From Everand
Profound Python Data Science
Onder Teker
No ratings yet
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet

Note: This service is not intended for secure transactions such as banking, social media, email, or purchasing. Use at your own risk. We assume no liability whatsoever for broken pages.

HW4ML Project Starter Code Template

Uploaded by

HW4ML Project Starter Code Template

Uploaded by

Accuracy, Parameters Count, Training Time (s), Inference Latency (ms).

Accuracy/Parameters Count, Accuracy/Training Time

Writing a bonus paragraph about pruning % and compression impact?

def create_base_model(input_shape, num_classes):

x_train = x_train.astype('float32') / 255

return (x_train, y_train), (x_test, y_test), input_shape, num_classes

def evaluate_model(dataset_name, max_epoch, device):

num_param = model.count_params() # counting number of model's

print(f"{dataset_name.upper()} Test Accuracy: {test_accuracy * 100:.2f}

return model, num_param, x_test, test_accuracy, train_time, eval_time

def profile_workload(model, device, dev_name, image, iterations=30):

prediction = model(image, training=False)

# Device priority: CUDA > MPS > CPU

Phase-3 code starter template

assert tf.version=='2.15.0', 'WARNING!!! different TensorFlow version may

def create_base_model(input_shape, num_classes):

x_train = x_train.astype('float32') / 255

return (x_train, y_train), (x_test, y_test), input_shape, num_classes

def evaluate_model(model, x_test, y_test, device):

def profile_workload(model, device, dev_name, image, iterations=30):

def profile_tflite_model(interpreter, input_tensor, iterations=30):

def quantize_model_to_int8(model, representative_data_gen,

print(f"INT8 Quantized model saved at {save_path}")

def evaluate_tflite_accuracy(tflite_model_path, x_test, y_test):

datasets = ['fashion_mnist', 'cifar10']

for dataset in datasets:

(x_train, y_train), (x_test, y_test), input_shape, num_classes =

early_stop = EarlyStopping(monitor='val_loss', patience=3,

test_acc_fp32, eval_time_fp32 = evaluate_model(model, x_test, y_test,

test_image = tf.convert_to_tensor(x_test[:1], dtype=tf.float32)

# Save original model

# Accuracy after quantization

# Inference latency after quantization

You might also like

Pfad - The Proxy pFad of © 2024 Garber Painting. All rights reserved.

HW4ML Project Starter Code Template

Uploaded by

HW4ML Project Starter Code Template

Uploaded by

Accuracy, Parameters Count, Training Time (s), Inference Latency (ms).

Accuracy/Parameters Count, Accuracy/Training Time

Writing a bonus paragraph about pruning % and compression impact?

def create_base_model(input_shape, num_classes):

x_train = x_train.astype('float32') / 255

return (x_train, y_train), (x_test, y_test), input_shape, num_classes

def evaluate_model(dataset_name, max_epoch, device):

num_param = model.count_params() # counting number of model's

print(f"{dataset_name.upper()} Test Accuracy: {test_accuracy * 100:.2f}

return model, num_param, x_test, test_accuracy, train_time, eval_time

def profile_workload(model, device, dev_name, image, iterations=30):

prediction = model(image, training=False)

# Device priority: CUDA > MPS > CPU

Phase-3 code starter template

assert tf.__version__=='2.15.0', 'WARNING!!! different TensorFlow version may

def create_base_model(input_shape, num_classes):

x_train = x_train.astype('float32') / 255

return (x_train, y_train), (x_test, y_test), input_shape, num_classes

def evaluate_model(model, x_test, y_test, device):

def profile_workload(model, device, dev_name, image, iterations=30):

def profile_tflite_model(interpreter, input_tensor, iterations=30):

def quantize_model_to_int8(model, representative_data_gen,

print(f"INT8 Quantized model saved at {save_path}")

def evaluate_tflite_accuracy(tflite_model_path, x_test, y_test):

datasets = ['fashion_mnist', 'cifar10']

for dataset in datasets:

(x_train, y_train), (x_test, y_test), input_shape, num_classes =

early_stop = EarlyStopping(monitor='val_loss', patience=3,

test_acc_fp32, eval_time_fp32 = evaluate_model(model, x_test, y_test,

test_image = tf.convert_to_tensor(x_test[:1], dtype=tf.float32)

# Save original model

# Accuracy after quantization

# Inference latency after quantization

You might also like

Pfad - The Proxy pFad of © 2024 Garber Painting. All rights reserved.

assert tf.version=='2.15.0', 'WARNING!!! different TensorFlow version may