import warnings
import os
warnings.filterwarnings("ignore")
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2' 

import tensorflow as tf
from tensorflow.keras import utils, datasets, layers, models
import matplotlib.pyplot as plt
import numpy as np

import matplotlib as mpl
import pickle
import csv
import itertools
from collections import defaultdict
import time
import pandas as pd
import math
from tqdm import tqdm
import dill

2023-10-28 19:03:51.509111: E tensorflow/stream_executor/cuda/cuda_blas.cc:2981] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered


gpus = tf.config.experimental.list_physical_devices('GPU')
if gpus:
    try:
        # Currently, memory growth needs to be the same across GPUs
        for gpu in gpus:
            tf.config.experimental.set_memory_growth(gpu, True)
        tf.config.experimental.set_visible_devices(gpus[1], 'GPU')
        logical_gpus = tf.config.experimental.list_logical_devices('GPU')
        print(len(gpus), "Physical GPUs,", len(logical_gpus), "Logical GPUs")
    except RuntimeError as e:
        # Memory growth must be set before GPUs have been initialized
        print(e)

4 Physical GPUs, 1 Logical GPUs


import urllib.request
if not os.path.exists("lab11_1_lib.py"):
    urllib.request.urlretrieve("https://nthu-datalab.github.io/ml/labs/11-1_CNN/lab11_1_lib.py", "lab11_1_lib.py")

from lab11_1_lib import draw_timeline


# Download and prepare the MNIST dataset
(train_image, train_label), (test_image, test_label) = datasets.mnist.load_data()

# Normalize pixel values to be between 0 and 1
train_image, test_image = train_image / 255.0, test_image / 255.0
print('shape of train_image:', train_image.shape)
print('shape of train_label:', train_label.shape)

shape of train_image: (60000, 28, 28)
shape of train_label: (60000,)


# flating the training data for dense layers
train_image_1 = train_image.reshape((60000, -1))
test_image_1 = test_image.reshape((10000, -1))
print(train_image_1.shape)
print(test_image_1.shape)

(60000, 784)
(10000, 784)


model_1 = models.Sequential()
model_1.add(layers.Dense(10, activation='softmax',input_shape=(784,)))
model_1.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
=================================================================
 dense (Dense)               (None, 10)                7850      
                                                                 
=================================================================
Total params: 7,850
Trainable params: 7,850
Non-trainable params: 0
_________________________________________________________________


# compile the model and train it for 3 epochs
model_1.compile(optimizer='adam',
              loss='sparse_categorical_crossentropy',
              metrics=['accuracy'])

model_1.fit(train_image_1, train_label, epochs=5)

Epoch 1/5
1875/1875 [==============================] - 6s 3ms/step - loss: 0.4647 - accuracy: 0.8791
Epoch 2/5
1875/1875 [==============================] - 5s 3ms/step - loss: 0.3031 - accuracy: 0.9156
Epoch 3/5
1875/1875 [==============================] - 5s 3ms/step - loss: 0.2830 - accuracy: 0.9211
Epoch 4/5
1875/1875 [==============================] - 5s 3ms/step - loss: 0.2729 - accuracy: 0.9235
Epoch 5/5
1875/1875 [==============================] - 5s 3ms/step - loss: 0.2668 - accuracy: 0.9259

<keras.callbacks.History at 0x7fd74031a490>


_, test_acc_1 = model_1.evaluate(test_image_1, test_label, verbose=0)
print('Testing Accuracy : %.4f'%test_acc_1)

Testing Accuracy : 0.9244


# reshaping the training data to 3 dimensions
train_image_2 = train_image.reshape((60000, 28, 28, 1))
test_image_2 = test_image.reshape((10000, 28, 28, 1))
print(train_image_2.shape)
print(test_image_2.shape)

(60000, 28, 28, 1)
(10000, 28, 28, 1)


#The 6 lines of code below define the convolutional base using a common pattern: a stack of Conv2D and MaxPooling2D layers.
model_2 = models.Sequential()
model_2.add(layers.Conv2D(32, (3, 3), strides=(1,1), padding='valid', activation='relu', input_shape=(28, 28, 1)))
model_2.add(layers.MaxPooling2D((2, 2)))
model_2.add(layers.Conv2D(64, (3, 3), strides=(1,1), padding='valid', activation='relu'))
model_2.add(layers.MaxPooling2D((2, 2)))
model_2.add(layers.Conv2D(64, (3, 3), strides=(1,1), padding='valid', activation='relu'))


model_2.summary()

Model: "sequential_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
=================================================================
 conv2d (Conv2D)             (None, 26, 26, 32)        320       
                                                                 
 max_pooling2d (MaxPooling2D  (None, 13, 13, 32)       0         
 )                                                               
                                                                 
 conv2d_1 (Conv2D)           (None, 11, 11, 64)        18496     
                                                                 
 max_pooling2d_1 (MaxPooling  (None, 5, 5, 64)         0         
 2D)                                                             
                                                                 
 conv2d_2 (Conv2D)           (None, 3, 3, 64)          36928     
                                                                 
=================================================================
Total params: 55,744
Trainable params: 55,744
Non-trainable params: 0
_________________________________________________________________


model_2.add(layers.Flatten())
model_2.add(layers.Dense(64, activation='relu'))
model_2.add(layers.Dropout(0.5))
model_2.add(layers.Dense(10, activation='softmax'))


model_2.summary()

Model: "sequential_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
=================================================================
 conv2d (Conv2D)             (None, 26, 26, 32)        320       
                                                                 
 max_pooling2d (MaxPooling2D  (None, 13, 13, 32)       0         
 )                                                               
                                                                 
 conv2d_1 (Conv2D)           (None, 11, 11, 64)        18496     
                                                                 
 max_pooling2d_1 (MaxPooling  (None, 5, 5, 64)         0         
 2D)                                                             
                                                                 
 conv2d_2 (Conv2D)           (None, 3, 3, 64)          36928     
                                                                 
 flatten (Flatten)           (None, 576)               0         
                                                                 
 dense_1 (Dense)             (None, 64)                36928     
                                                                 
 dropout (Dropout)           (None, 64)                0         
                                                                 
 dense_2 (Dense)             (None, 10)                650       
                                                                 
=================================================================
Total params: 93,322
Trainable params: 93,322
Non-trainable params: 0
_________________________________________________________________


model_2.compile(optimizer='adam',
              loss='sparse_categorical_crossentropy',
              metrics=['accuracy'])

model_2.fit(train_image_2, train_label, epochs=5)

Epoch 1/5
1875/1875 [==============================] - 13s 6ms/step - loss: 0.2837 - accuracy: 0.9125
Epoch 2/5
1875/1875 [==============================] - 11s 6ms/step - loss: 0.0905 - accuracy: 0.9751
Epoch 3/5
1875/1875 [==============================] - 11s 6ms/step - loss: 0.0646 - accuracy: 0.9819
Epoch 4/5
1875/1875 [==============================] - 11s 6ms/step - loss: 0.0508 - accuracy: 0.9856
Epoch 5/5
1875/1875 [==============================] - 11s 6ms/step - loss: 0.0418 - accuracy: 0.9876

<keras.callbacks.History at 0x7fd7400adcd0>


_, test_acc_2 = model_2.evaluate(test_image_2, test_label, verbose=0)
print('Testing Accuracy : %.4f'%test_acc_2)

Testing Accuracy : 0.9912


# Loading Data

(X_train, y_train), (X_test, y_test) = datasets.cifar10.load_data()

# normalize inputs from 0-255 to 0.0-1.0
X_train = X_train.astype('float32')
X_test = X_test.astype('float32')
X_train = X_train / 255.0
X_test = X_test / 255.0

# convert class vectors to binary vectors
Y_train = utils.to_categorical(y_train)
Y_test = utils.to_categorical(y_test)

print('X_train shape:', X_train.shape)
print('Y_train shape:', Y_train.shape)
print('X_test shape:', X_test.shape)
print('Y_test shape:', Y_test.shape)

X_train shape: (50000, 32, 32, 3)
Y_train shape: (50000, 10)
X_test shape: (10000, 32, 32, 3)
Y_test shape: (10000, 10)


# transform a 3-channel image into one channel
def grayscale(data, dtype='float32'):
    # luma coding weighted average in video systems
    r = np.asarray(.3, dtype=dtype)
    g = np.asarray(.59, dtype=dtype)
    b = np.asarray(.11, dtype=dtype)
    rst = r * data[:, :, :, 0] + g * data[:, :, :, 1] + b * data[:, :, :, 2]
    # add channel dimension
    rst = np.expand_dims(rst, axis=3)
    return rst

X_train_gray = grayscale(X_train)
X_test_gray = grayscale(X_test)

# plot a randomly chosen image
img = round(np.random.rand() * X_train.shape[0])
plt.figure(figsize=(4, 2))
plt.subplot(1, 2, 1)
plt.imshow(X_train[img], interpolation='none')
plt.subplot(1, 2, 2)
plt.imshow(
    X_train_gray[img, :, :, 0], cmap=plt.get_cmap('gray'), interpolation='none')
plt.show()


def getHOGfeat(image,
               stride=8,
               orientations=8,
               pixels_per_cell=(8, 8),
               cells_per_block=(2, 2)):
    cx, cy = pixels_per_cell
    bx, by = cells_per_block
    sx, sy, sz = image.shape
    n_cellsx = int(np.floor(sx // cx))  # number of cells in x
    n_cellsy = int(np.floor(sy // cy))  # number of cells in y
    n_blocksx = (n_cellsx - bx) + 1
    n_blocksy = (n_cellsy - by) + 1
    gx = np.zeros((sx, sy), dtype=np.double)
    gy = np.zeros((sx, sy), dtype=np.double)
    eps = 1e-5
    grad = np.zeros((sx, sy, 2), dtype=np.double)
    for i in range(1, sx - 1):
        for j in range(1, sy - 1):
            gx[i, j] = image[i, j - 1] - image[i, j + 1]
            gy[i, j] = image[i + 1, j] - image[i - 1, j]
            grad[i, j, 0] = np.arctan(gy[i, j] / (gx[i, j] + eps)) * 180 / math.pi
            if gx[i, j] < 0:
                grad[i, j, 0] += 180
            grad[i, j, 0] = (grad[i, j, 0] + 360) % 360
            grad[i, j, 1] = np.sqrt(gy[i, j] ** 2 + gx[i, j] ** 2)
    normalised_blocks = np.zeros((n_blocksy, n_blocksx, by * bx * orientations))
    for y in range(n_blocksy):
        for x in range(n_blocksx):
            block = grad[y * stride:y * stride + 16, x * stride:x * stride + 16]
            hist_block = np.zeros(32, dtype=np.double)
            eps = 1e-5
            for k in range(by):
                for m in range(bx):
                    cell = block[k * 8:(k + 1) * 8, m * 8:(m + 1) * 8]
                    hist_cell = np.zeros(8, dtype=np.double)
                    for i in range(cy):
                        for j in range(cx):
                            n = int(cell[i, j, 0] / 45)
                            hist_cell[n] += cell[i, j, 1]
                    hist_block[(k * bx + m) * orientations:(k * bx + m + 1) * orientations] = hist_cell[:]
            normalised_blocks[y, x, :] = hist_block / np.sqrt(
                hist_block.sum() ** 2 + eps)
    return normalised_blocks.ravel()


X_train_hog = []
X_test_hog = []

print('This will take some minutes.')

for img in tqdm(X_train_gray):
    img_hog = getHOGfeat(img)
    X_train_hog.append(img_hog)

for img in tqdm(X_test_gray):
    img_hog = getHOGfeat(img)
    X_test_hog.append(img_hog)
    
X_train_hog_array = np.asarray(X_train_hog)
X_test_hog_array = np.asarray(X_test_hog)

This will take some minutes.

100%|████████████████████████████████████| 50000/50000 [05:31<00:00, 150.88it/s]
100%|████████████████████████████████████| 10000/10000 [01:06<00:00, 151.50it/s]


# KNN
from sklearn.neighbors import KNeighborsClassifier 
from sklearn.metrics import accuracy_score

# p=2 and metric='minkowski' means the Euclidean Distance
knn = KNeighborsClassifier(n_neighbors=11, p=2, metric='minkowski')

knn.fit(X_train_hog_array, y_train.ravel())
y_pred = knn.predict(X_test_hog_array)
print('[KNN]')
print('Misclassified samples: %d' % (y_test.ravel() != y_pred).sum())
print('Accuracy: %.2f' % accuracy_score(y_test, y_pred))

[KNN]
Misclassified samples: 5334
Accuracy: 0.47


# SVM
from sklearn.svm import SVC 

print('This will take some minutes.')
start_time = time.time()

# C is the hyperparameter for the error penalty term
# gamma is the hyperparameter for the rbf kernel
svm_linear = SVC(kernel='linear', random_state=0, gamma=0.2, C=10.0)

svm_linear.fit(X_train_hog_array, y_train.ravel())
y_pred = svm_linear.predict(X_test_hog_array)
print('[Linear SVC]')
print('Misclassified samples: %d' % (y_test.ravel() != y_pred).sum())
print('Accuracy: %.2f' % accuracy_score(y_test.ravel(), y_pred))

print('{:.2f} sec.'.format(time.time()-start_time))

This will take some minutes.
[Linear SVC]
Misclassified samples: 4940
Accuracy: 0.51
495.08 sec.


model_3 = models.Sequential()

#The 6 lines of code below define the convolutional base using a common pattern: a stack of Conv2D and MaxPooling2D layers.
model_3.add(layers.Conv2D(64, (5, 5), padding='same', activation='relu', input_shape=(32, 32, 3)))
model_3.add(layers.MaxPool2D(pool_size=3,strides=2,padding='same'))
model_3.add(layers.BatchNormalization())
model_3.add(layers.Conv2D(64, (5, 5), padding='same', activation='relu'))
model_3.add(layers.MaxPool2D(pool_size=3,strides=2,padding='same'))
model_3.add(layers.BatchNormalization())
                
model_3.add(layers.Flatten())
model_3.add(layers.Dense(384, activation='relu'))
model_3.add(layers.Dropout(0.5))
model_3.add(layers.Dense(192, activation='relu'))
model_3.add(layers.Dense(10, activation='softmax'))
model_3.compile(optimizer='adam',
              loss='sparse_categorical_crossentropy',
              metrics=['accuracy'])

model_3.summary()

Model: "sequential_2"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
=================================================================
 conv2d_3 (Conv2D)           (None, 32, 32, 64)        4864      
                                                                 
 max_pooling2d_2 (MaxPooling  (None, 16, 16, 64)       0         
 2D)                                                             
                                                                 
 batch_normalization (BatchN  (None, 16, 16, 64)       256       
 ormalization)                                                   
                                                                 
 conv2d_4 (Conv2D)           (None, 16, 16, 64)        102464    
                                                                 
 max_pooling2d_3 (MaxPooling  (None, 8, 8, 64)         0         
 2D)                                                             
                                                                 
 batch_normalization_1 (Batc  (None, 8, 8, 64)         256       
 hNormalization)                                                 
                                                                 
 flatten_1 (Flatten)         (None, 4096)              0         
                                                                 
 dense_3 (Dense)             (None, 384)               1573248   
                                                                 
 dropout_1 (Dropout)         (None, 384)               0         
                                                                 
 dense_4 (Dense)             (None, 192)               73920     
                                                                 
 dense_5 (Dense)             (None, 10)                1930      
                                                                 
=================================================================
Total params: 1,756,938
Trainable params: 1,756,682
Non-trainable params: 256
_________________________________________________________________


model_3.fit(X_train, y_train, epochs=5, validation_data=(X_test, y_test), verbose=1)
_, test_acc_3 = model_3.evaluate(X_test, y_test, verbose=0)
print('Testing Accuracy : %.4f'%test_acc_3)

Epoch 1/5
1563/1563 [==============================] - 13s 8ms/step - loss: 1.6064 - accuracy: 0.4281 - val_loss: 1.3853 - val_accuracy: 0.5148
Epoch 2/5
1563/1563 [==============================] - 12s 8ms/step - loss: 1.1151 - accuracy: 0.6074 - val_loss: 1.1946 - val_accuracy: 0.5959
Epoch 3/5
1563/1563 [==============================] - 12s 8ms/step - loss: 0.9340 - accuracy: 0.6749 - val_loss: 1.0923 - val_accuracy: 0.6232
Epoch 4/5
1563/1563 [==============================] - 12s 8ms/step - loss: 0.8215 - accuracy: 0.7152 - val_loss: 1.0149 - val_accuracy: 0.6511
Epoch 5/5
1563/1563 [==============================] - 11s 7ms/step - loss: 0.7306 - accuracy: 0.7488 - val_loss: 0.8527 - val_accuracy: 0.7087
Testing Accuracy : 0.7087


# number of samples
n_samples = 200

# an array with shape (n_samples, 5)
raw_data_a = np.random.rand(n_samples, 5)
# a list with length of n_samples from 0 to n_samples-1
raw_data_b = np.arange(n_samples)
print(raw_data_a.shape, raw_data_b.shape)

(200, 5) (200,)


# this tells the dataset that each row of raw_data_a is corresponding to each element of raw_data_b
raw_dataset = tf.data.Dataset.from_tensor_slices((raw_data_a, raw_data_b))


# Here, we print the first 8 batches.
for i,elem in enumerate(raw_dataset):
    print("Batch ", i, ", b are ", elem)
    if i==7:
        break

Batch  0 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.66931552, 0.60461851, 0.48526867, 0.35751424, 0.42699349])>, <tf.Tensor: shape=(), dtype=int64, numpy=0>)
Batch  1 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.84717025, 0.3991303 , 0.76538914, 0.67931079, 0.23154431])>, <tf.Tensor: shape=(), dtype=int64, numpy=1>)
Batch  2 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.25540675, 0.80812385, 0.04000756, 0.45713614, 0.97573978])>, <tf.Tensor: shape=(), dtype=int64, numpy=2>)
Batch  3 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.0938586 , 0.6594527 , 0.02701433, 0.31752666, 0.44325064])>, <tf.Tensor: shape=(), dtype=int64, numpy=3>)
Batch  4 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.73322097, 0.48946239, 0.3686729 , 0.04317379, 0.74173232])>, <tf.Tensor: shape=(), dtype=int64, numpy=4>)
Batch  5 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.02034684, 0.05158959, 0.71902387, 0.61182723, 0.23348519])>, <tf.Tensor: shape=(), dtype=int64, numpy=5>)
Batch  6 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.18205827, 0.70072316, 0.37018672, 0.11622035, 0.43881617])>, <tf.Tensor: shape=(), dtype=int64, numpy=6>)
Batch  7 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.70428993, 0.00845075, 0.02440134, 0.90915499, 0.30298183])>, <tf.Tensor: shape=(), dtype=int64, numpy=7>)


# Here, we print the first 8 batches.
it = iter(raw_dataset)
for i in range(8):
    print("Batch ", i, ", b are ", next(it))

Batch  0 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.66931552, 0.60461851, 0.48526867, 0.35751424, 0.42699349])>, <tf.Tensor: shape=(), dtype=int64, numpy=0>)
Batch  1 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.84717025, 0.3991303 , 0.76538914, 0.67931079, 0.23154431])>, <tf.Tensor: shape=(), dtype=int64, numpy=1>)
Batch  2 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.25540675, 0.80812385, 0.04000756, 0.45713614, 0.97573978])>, <tf.Tensor: shape=(), dtype=int64, numpy=2>)
Batch  3 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.0938586 , 0.6594527 , 0.02701433, 0.31752666, 0.44325064])>, <tf.Tensor: shape=(), dtype=int64, numpy=3>)
Batch  4 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.73322097, 0.48946239, 0.3686729 , 0.04317379, 0.74173232])>, <tf.Tensor: shape=(), dtype=int64, numpy=4>)
Batch  5 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.02034684, 0.05158959, 0.71902387, 0.61182723, 0.23348519])>, <tf.Tensor: shape=(), dtype=int64, numpy=5>)
Batch  6 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.18205827, 0.70072316, 0.37018672, 0.11622035, 0.43881617])>, <tf.Tensor: shape=(), dtype=int64, numpy=6>)
Batch  7 , b are  (<tf.Tensor: shape=(5,), dtype=float64, numpy=array([0.70428993, 0.00845075, 0.02440134, 0.90915499, 0.30298183])>, <tf.Tensor: shape=(), dtype=int64, numpy=7>)


def preprocess_function(one_row_a, one_b):
    """
        Input: one slice of the dataset
        Output: modified slice
    """
    # Do some data preprocessing, you can also input filenames and load data in here
    # Here, we transform each row of raw_data_a to its sum and mean
    one_row_a = [tf.reduce_sum(one_row_a), tf.reduce_mean(one_row_a)]

    return one_row_a, one_b

raw_dataset = raw_dataset.map(preprocess_function, num_parallel_calls=tf.data.experimental.AUTOTUNE)


it = iter(raw_dataset)
for i in range(8):
    print("Batch ", i, ", b are ", next(it))

Batch  0 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([2.54371044, 0.50874209])>, <tf.Tensor: shape=(), dtype=int64, numpy=0>)
Batch  1 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([2.92254479, 0.58450896])>, <tf.Tensor: shape=(), dtype=int64, numpy=1>)
Batch  2 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([2.53641408, 0.50728282])>, <tf.Tensor: shape=(), dtype=int64, numpy=2>)
Batch  3 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([1.54110293, 0.30822059])>, <tf.Tensor: shape=(), dtype=int64, numpy=3>)
Batch  4 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([2.37626237, 0.47525247])>, <tf.Tensor: shape=(), dtype=int64, numpy=4>)
Batch  5 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([1.63627272, 0.32725454])>, <tf.Tensor: shape=(), dtype=int64, numpy=5>)
Batch  6 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([1.80800466, 0.36160093])>, <tf.Tensor: shape=(), dtype=int64, numpy=6>)
Batch  7 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([1.94927884, 0.38985577])>, <tf.Tensor: shape=(), dtype=int64, numpy=7>)


dataset = raw_dataset.shuffle(16)


idxs = []
for i,elem in enumerate(dataset):
    print("Batch ", i, ", b are ", elem)
    idxs.append(elem[1].numpy())
    if i==7:
        break
        
print("\nThe order of the first 8 shuffle from [0, 1, 2, 3, 4, 5, 6, 7] to ",idxs)

Batch  0 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([2.24929143, 0.44985829])>, <tf.Tensor: shape=(), dtype=int64, numpy=13>)
Batch  1 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([2.51418351, 0.5028367 ])>, <tf.Tensor: shape=(), dtype=int64, numpy=8>)
Batch  2 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([2.52106856, 0.50421371])>, <tf.Tensor: shape=(), dtype=int64, numpy=17>)
Batch  3 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([2.01846541, 0.40369308])>, <tf.Tensor: shape=(), dtype=int64, numpy=10>)
Batch  4 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([3.15692468, 0.63138494])>, <tf.Tensor: shape=(), dtype=int64, numpy=12>)
Batch  5 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([2.27690284, 0.45538057])>, <tf.Tensor: shape=(), dtype=int64, numpy=16>)
Batch  6 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([2.54371044, 0.50874209])>, <tf.Tensor: shape=(), dtype=int64, numpy=0>)
Batch  7 , b are  (<tf.Tensor: shape=(2,), dtype=float64, numpy=array([3.28908268, 0.65781654])>, <tf.Tensor: shape=(), dtype=int64, numpy=19>)

The order of the first 8 shuffle from [0, 1, 2, 3, 4, 5, 6, 7] to  [13, 8, 17, 10, 12, 16, 0, 19]


dataset = dataset.batch(2, drop_remainder=False)


idxs = []
for i,elem in enumerate(dataset):
    print("Batch ", i, ", b are ", elem)
    print("")
    idxs.append(elem[1].numpy())
    if i==7:
        break
        
print("\nAfter `dataset.batch(2)`,\nBatch 0 is combined by %dth and %dth,\nBatch 1 is combined by %dth and %dth,\nBatch 2 is combined by %dth and %dth, etc."%(idxs[0][0],idxs[0][1],idxs[1][0],idxs[1][1],idxs[2][0],idxs[2][1]))

Batch  0 , b are  (<tf.Tensor: shape=(2, 2), dtype=float64, numpy=
array([[2.51418351, 0.5028367 ],
       [2.24929143, 0.44985829]])>, <tf.Tensor: shape=(2,), dtype=int64, numpy=array([ 8, 13])>)

Batch  1 , b are  (<tf.Tensor: shape=(2, 2), dtype=float64, numpy=
array([[2.92254479, 0.58450896],
       [2.54371044, 0.50874209]])>, <tf.Tensor: shape=(2,), dtype=int64, numpy=array([1, 0])>)

Batch  2 , b are  (<tf.Tensor: shape=(2, 2), dtype=float64, numpy=
array([[1.80800466, 0.36160093],
       [1.54110293, 0.30822059]])>, <tf.Tensor: shape=(2,), dtype=int64, numpy=array([6, 3])>)

Batch  3 , b are  (<tf.Tensor: shape=(2, 2), dtype=float64, numpy=
array([[3.28908268, 0.65781654],
       [2.27690284, 0.45538057]])>, <tf.Tensor: shape=(2,), dtype=int64, numpy=array([19, 16])>)

Batch  4 , b are  (<tf.Tensor: shape=(2, 2), dtype=float64, numpy=
array([[1.94927884, 0.38985577],
       [2.32019   , 0.464038  ]])>, <tf.Tensor: shape=(2,), dtype=int64, numpy=array([7, 9])>)

Batch  5 , b are  (<tf.Tensor: shape=(2, 2), dtype=float64, numpy=
array([[2.01846541, 0.40369308],
       [2.09043057, 0.41808611]])>, <tf.Tensor: shape=(2,), dtype=int64, numpy=array([10, 24])>)

Batch  6 , b are  (<tf.Tensor: shape=(2, 2), dtype=float64, numpy=
array([[2.67089385, 0.53417877],
       [2.37626237, 0.47525247]])>, <tf.Tensor: shape=(2,), dtype=int64, numpy=array([26,  4])>)

Batch  7 , b are  (<tf.Tensor: shape=(2, 2), dtype=float64, numpy=
array([[3.49696451, 0.6993929 ],
       [2.53641408, 0.50728282]])>, <tf.Tensor: shape=(2,), dtype=int64, numpy=array([14,  2])>)


After `dataset.batch(2)`,
Batch 0 is combined by 8th and 13th,
Batch 1 is combined by 1th and 0th,
Batch 2 is combined by 6th and 3th, etc.


dataset = dataset.repeat(2)


epochs = 3

for epoch in range(epochs):
    size = 0
    n_batch = 0
    for batch in dataset:
        size += len(batch[1])
        n_batch += 1
    print("End of epoch %d: Total %d batches in this epoch with %d pieces of data"%(epoch, n_batch, size))

End of epoch 0: Total 200 batches in this epoch with 400 pieces of data
End of epoch 1: Total 200 batches in this epoch with 400 pieces of data
End of epoch 2: Total 200 batches in this epoch with 400 pieces of data


dataset = dataset.prefetch(buffer_size=tf.data.experimental.AUTOTUNE)


# use this function to plot the size of each batch.
def plot_batch_sizes(ds,title):
    batch_sizes = [batch[1].shape[0] for batch in ds]
    plt.bar(range(len(batch_sizes)), batch_sizes)
    plt.xlabel('Batch number')
    plt.ylabel('Batch size')
    plt.title(title)
    plt.show()


# plot the bar diagram of repeat+batch
repeat_batch_ds = raw_dataset.repeat(3).batch(32)
plot_batch_sizes(repeat_batch_ds,'repeat+batch')


# plot the bar diagram of batch+repeat
batch_repeat_ds = raw_dataset.batch(32).repeat(3)
plot_batch_sizes(batch_repeat_ds,'batch+repeat')


# You can find that a repeat before a shuffle mixes the epoch boundaries in this graph.
shuffle_repeat_ds = raw_dataset.shuffle(32).repeat(3).batch(16)
repeat_shuffle_ds = raw_dataset.repeat(3).shuffle(32).batch(16)

shuffle_repeat = [batch[1].numpy().mean() for batch in shuffle_repeat_ds]
repeat_shuffle = [batch[1].numpy().mean() for batch in repeat_shuffle_ds]

plt.plot(shuffle_repeat, label="shuffle().repeat()")
plt.plot(repeat_shuffle, label="repeat().shuffle()")
plt.xlabel('Batch number')
plt.ylabel("Mean of b in each batch")
plt.legend()

<matplotlib.legend.Legend at 0x7fd9111fbb80>


# the url to download CIFAR-10 dataset (binary version)
# see format and details here: http://www.cs.toronto.edu/~kriz/cifar.html
DATA_URL = 'https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz'
# the image size we want to keep
IMAGE_SIZE_CROPPED = 24
IMAGE_HEIGHT = 32
IMAGE_WIDTH = 32
IMAGE_DEPTH = 3


# donwnload data
if not os.path.exists("cifar-10-batches-py/"): 
    cifar10 = utils.get_file('cifar-10-python.tar.gz',
                                      cache_subdir=os.path.abspath('.'),
                                      origin = DATA_URL,
                                      extract = True)


DEST_DIRECTORY = 'cifar-10-batches-py'
filenames_train = [os.path.join(DEST_DIRECTORY,'data_batch_%d' % i) for i in range(1,6)]
filenames_test = [os.path.join(DEST_DIRECTORY,'test_batch')]


# save (img_path, label) pairs
with open('cifar10_train.csv', 'w', newline='') as csvfile:
    writer = csv.writer(csvfile)
    writer.writerow(['filenames'])
    writer.writerows(np.array(filenames_train).reshape(-1,1))
        
with open('cifar10_test.csv', 'w', newline='') as csvfile:
    writer = csv.writer(csvfile)
    writer.writerow(['filenames'])
    writer.writerows(np.array(filenames_test).reshape(-1,1))


# read data
def read_file(file):
    with open(file, 'rb') as fo:
        raw_data = pickle.load(fo, encoding='bytes')
    return raw_data[b'data'],raw_data[b'labels']

# parse training data
@tf.function
def map_fun(image,label):
    image = tf.reshape(image,[IMAGE_DEPTH,IMAGE_HEIGHT,IMAGE_WIDTH])
    image = tf.divide(tf.cast(tf.transpose(image,[1,2,0]),tf.float32),255.0)
    label = tf.one_hot(label,10)
    distorted_image = tf.image.resize_with_crop_or_pad(image, IMAGE_SIZE_CROPPED,IMAGE_SIZE_CROPPED)
    distorted_image = tf.image.random_flip_left_right(distorted_image)
    distorted_image = tf.image.random_brightness(distorted_image, max_delta=63)
    distorted_image = tf.image.random_contrast(distorted_image, lower=0.2, upper=1.8)
    distorted_image = tf.image.per_image_standardization(distorted_image)
    return distorted_image, label

# parse testing data
@tf.function
def map_fun_test(image,label):
    image = tf.reshape(image,[IMAGE_DEPTH,IMAGE_HEIGHT,IMAGE_WIDTH])
    image = tf.divide(tf.cast(tf.transpose(image,[1,2,0]),tf.float32),255.0)
    label = tf.one_hot(label,10)
    distorted_image = tf.image.resize_with_crop_or_pad(image, IMAGE_SIZE_CROPPED,IMAGE_SIZE_CROPPED)
    distorted_image = tf.image.per_image_standardization(distorted_image)
    return distorted_image, label


X_train = None
Y_train = None
X_test = None
Y_test = None

for filename in filenames_train:
    image,label = read_file(filename)
    X_train = image if X_train is None else np.concatenate((X_train,image))
    Y_train = label if Y_train is None else np.concatenate((Y_train,label))

for filename in filenames_test:
    image,label = read_file(filename)
    X_test = image if X_test is None else np.concatenate((X_test,image))
    Y_test = label if Y_test is None else np.concatenate((Y_test,label))

# Construct training Dataset
dataset = tf.data.Dataset.from_tensor_slices((X_train,Y_train)).map(map_fun).shuffle(10000).batch(64)

# # Construct testing Dataset
dataset_test = tf.data.Dataset.from_tensor_slices((X_test,Y_test)).map(map_fun_test).batch(64)


model_cifar = models.Sequential()

model_cifar.add(layers.Conv2D(64, (5, 5), padding='same', activation='relu', input_shape=(24, 24, 3)))
model_cifar.add(layers.MaxPool2D(pool_size=3,strides=2,padding='same'))
model_cifar.add(layers.BatchNormalization())
                
model_cifar.add(layers.Conv2D(64, (5, 5), padding='same', activation='relu'))
model_cifar.add(layers.MaxPool2D(pool_size=3,strides=2,padding='same'))
model_cifar.add(layers.BatchNormalization())
                
model_cifar.add(layers.Flatten())
model_cifar.add(layers.Dense(384, activation='relu'))
model_cifar.add(layers.Dropout(0.5))
model_cifar.add(layers.Dense(192, activation='relu'))
model_cifar.add(layers.Dropout(0.5))
model_cifar.add(layers.Dense(10, activation='softmax'))


model_cifar.compile(optimizer='adam',
              loss='categorical_crossentropy',
              metrics=['accuracy'])
model_cifar.summary()

Model: "sequential_3"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
=================================================================
 conv2d_5 (Conv2D)           (None, 24, 24, 64)        4864      
                                                                 
 max_pooling2d_4 (MaxPooling  (None, 12, 12, 64)       0         
 2D)                                                             
                                                                 
 batch_normalization_2 (Batc  (None, 12, 12, 64)       256       
 hNormalization)                                                 
                                                                 
 conv2d_6 (Conv2D)           (None, 12, 12, 64)        102464    
                                                                 
 max_pooling2d_5 (MaxPooling  (None, 6, 6, 64)         0         
 2D)                                                             
                                                                 
 batch_normalization_3 (Batc  (None, 6, 6, 64)         256       
 hNormalization)                                                 
                                                                 
 flatten_2 (Flatten)         (None, 2304)              0         
                                                                 
 dense_6 (Dense)             (None, 384)               885120    
                                                                 
 dropout_2 (Dropout)         (None, 384)               0         
                                                                 
 dense_7 (Dense)             (None, 192)               73920     
                                                                 
 dropout_3 (Dropout)         (None, 192)               0         
                                                                 
 dense_8 (Dense)             (None, 10)                1930      
                                                                 
=================================================================
Total params: 1,068,810
Trainable params: 1,068,554
Non-trainable params: 256
_________________________________________________________________


model_cifar.fit(dataset, epochs=5, validation_data=dataset_test, verbose=1)
_, test_acc = model_cifar.evaluate(dataset_test, verbose=0)
print('test accuracy:',test_acc)

Epoch 1/5
782/782 [==============================] - 15s 17ms/step - loss: 1.7770 - accuracy: 0.3714 - val_loss: 1.3185 - val_accuracy: 0.5377
Epoch 2/5
782/782 [==============================] - 15s 17ms/step - loss: 1.3668 - accuracy: 0.5230 - val_loss: 1.1346 - val_accuracy: 0.6129
Epoch 3/5
782/782 [==============================] - 14s 16ms/step - loss: 1.1993 - accuracy: 0.5868 - val_loss: 0.9907 - val_accuracy: 0.6583
Epoch 4/5
782/782 [==============================] - 15s 17ms/step - loss: 1.0905 - accuracy: 0.6259 - val_loss: 0.9453 - val_accuracy: 0.6792
Epoch 5/5
782/782 [==============================] - 14s 16ms/step - loss: 1.0106 - accuracy: 0.6553 - val_loss: 0.8773 - val_accuracy: 0.7092
test accuracy: 0.7092000246047974


# construct a new dataset with time informantion
class TimeMeasuredDataset(tf.data.Dataset):
    # OUTPUT: (steps, timings, counters, img, label)
    OUTPUT_SIGNATURE=(
        tf.TensorSpec(shape=(2, 1), dtype=tf.string), # steps: [("Open",), ("Read",)]
        tf.TensorSpec(shape=(2, 2), dtype=tf.float32), # timings: [(open_enter, open_elapsed), (read_enter, read_elapsed)]
        tf.TensorSpec(shape=(2, 3), dtype=tf.int32), # counters: [(instance_idx, epoch_idx, -1), (instance_idx, epoch_idx, example_idx)]
        tf.TensorSpec(shape=(3072), dtype=tf.float32), # img: 32*32*3
        tf.TensorSpec(shape=(), dtype=tf.int32) # label
    )

    _INSTANCES_COUNTER = itertools.count()  # Number of datasets generated
    _EPOCHS_COUNTER = defaultdict(itertools.count)  # Number of epochs done for each dataset

    def _generator(instance_idx, filename, open_file, read_file):
        epoch_idx = next(TimeMeasuredDataset._EPOCHS_COUNTER[instance_idx])

        # Opening the file
        open_enter = time.perf_counter()
        filenames = open_file(filename)
        open_elapsed = time.perf_counter() - open_enter
        # ----------------
        
        # Reading the file
        read_enter = time.perf_counter()
        imgs, label = [], []
        for filename in filenames:
            tmp_imgs, tmp_label = read_file(filename)
            imgs.append(tmp_imgs)
            label.append(tmp_label)
        imgs = tf.concat(imgs, axis=0)
        label = tf.concat(label, axis=0)
        read_elapsed = (time.perf_counter() - read_enter) / imgs.shape[0]
        
        for sample_idx in range(imgs.shape[0]):
            read_enter = read_enter if sample_idx == 0 else time.perf_counter()
            
            yield (
                [("Open",), ("Read",)],
                [(open_enter, open_elapsed), (read_enter, read_elapsed)],
                [(instance_idx, epoch_idx, -1), (instance_idx, epoch_idx, sample_idx)],
                imgs[sample_idx],
                label[sample_idx]
            )
            open_enter, open_elapsed = -1., -1.  # Negative values will be filtered


    def __new__(cls, filename, open_file, read_file):
        def generator_func(instance_idx, filename):
            return cls._generator(instance_idx, filename, open_file, read_file)

        return tf.data.Dataset.from_generator(
            generator_func,
            output_signature=cls.OUTPUT_SIGNATURE,
            args=(next(cls._INSTANCES_COUNTER), filename)
        )


def open_file(filename):
    rows = pd.read_csv(filename.decode("utf-8"))
    filenames = rows['filenames']
    return filenames

def read_file(filename):
    with open(filename, 'rb') as fo:
        raw_data = pickle.load(fo, encoding='bytes')
    return raw_data[b'data'], raw_data[b'labels']

def dataset_generator_fun_train(*args):
    return TimeMeasuredDataset('cifar10_train.csv', open_file, read_file)

def dataset_generator_fun_test(*args):
    return TimeMeasuredDataset('cifar10_test.csv', open_file, read_file)

for i in tf.data.Dataset.range(1).flat_map(dataset_generator_fun_train).take(2):
    print(i)
    print("now time", time.perf_counter())
    print("-------------------------------------------------------------------------------")

(<tf.Tensor: shape=(2, 1), dtype=string, numpy=
array([[b'Open'],
       [b'Read']], dtype=object)>, <tf.Tensor: shape=(2, 2), dtype=float32, numpy=
array([[4.9066791e+05, 4.5651230e-03],
       [4.9066794e+05, 2.5628499e-06]], dtype=float32)>, <tf.Tensor: shape=(2, 3), dtype=int32, numpy=
array([[ 0,  0, -1],
       [ 0,  0,  0]], dtype=int32)>, <tf.Tensor: shape=(3072,), dtype=float32, numpy=array([ 59.,  43.,  50., ..., 140.,  84.,  72.], dtype=float32)>, <tf.Tensor: shape=(), dtype=int32, numpy=6>)
now time 490668.059314616
-------------------------------------------------------------------------------
(<tf.Tensor: shape=(2, 1), dtype=string, numpy=
array([[b'Open'],
       [b'Read']], dtype=object)>, <tf.Tensor: shape=(2, 2), dtype=float32, numpy=
array([[-1.0000000e+00, -1.0000000e+00],
       [ 4.9066806e+05,  2.5628499e-06]], dtype=float32)>, <tf.Tensor: shape=(2, 3), dtype=int32, numpy=
array([[ 0,  0, -1],
       [ 0,  0,  1]], dtype=int32)>, <tf.Tensor: shape=(3072,), dtype=float32, numpy=array([154., 126., 105., ..., 139., 142., 144.], dtype=float32)>, <tf.Tensor: shape=(), dtype=int32, numpy=9>)
now time 490668.063010501
-------------------------------------------------------------------------------


IMAGE_SIZE_CROPPED = 24
IMAGE_HEIGHT = 32
IMAGE_WIDTH = 32
IMAGE_DEPTH = 3

def map_decorator(func):
    def wrapper(steps, times, values, image, label):
        # Use a tf.py_function to prevent auto-graph from compiling the method
        return tf.py_function(
            func,
            inp=(steps, times, values, image, label),
            Tout=(steps.dtype, times.dtype, values.dtype, image.dtype, tf.float32)
        )
    return wrapper

@map_decorator
def map_fun_with_time(steps, times, values, image, label):
    # sleep to avoid concurrency issue
    time.sleep(0.05)
    
    # record the enter time into map_fun()
    map_enter = time.perf_counter()
    
    image = tf.reshape(image,[IMAGE_DEPTH, IMAGE_HEIGHT, IMAGE_WIDTH])
    image = tf.divide(tf.cast(tf.transpose(image,[1, 2, 0]),tf.float32),255.0)
    label = tf.one_hot(label, 10)
    distorted_image = tf.image.random_crop(image, [IMAGE_SIZE_CROPPED,IMAGE_SIZE_CROPPED,IMAGE_DEPTH])
    # distorted_image = tf.image.resize(image, [IMAGE_SIZE_CROPPED,IMAGE_SIZE_CROPPED])
    distorted_image = tf.image.random_flip_left_right(distorted_image)
    distorted_image = tf.image.random_brightness(distorted_image, max_delta=63)
    distorted_image = tf.image.random_contrast(distorted_image, lower=0.2, upper=1.8)
    distorted_image = tf.image.per_image_standardization(distorted_image)
    
    map_elapsed = time.perf_counter() - map_enter
    # ----------------
    
    return tf.concat((steps, [["Map"]]), axis=0),\
           tf.concat((times, [[map_enter, map_elapsed]]), axis=0),\
           tf.concat((values, [values[-1]]), axis=0),\
           distorted_image,\
           label

@map_decorator
def map_fun_test_with_time(steps, times, values, image, label):
    # sleep to avoid concurrency issue
    time.sleep(0.05)
    
    # record the enter time into map_fun_test()
    map_enter = time.perf_counter()
    
    image = tf.reshape(image,[IMAGE_DEPTH,IMAGE_HEIGHT,IMAGE_WIDTH])
    image = tf.divide(tf.cast(tf.transpose(image,[1,2,0]),tf.float32),255.0)
    label = tf.one_hot(label,10)
    distorted_image = tf.image.resize(image, [IMAGE_SIZE_CROPPED,IMAGE_SIZE_CROPPED])
    distorted_image = tf.image.per_image_standardization(distorted_image)
    
    map_elapsed = time.perf_counter() - map_enter
    # ----------------
    
    return tf.concat((steps, [["Map"]]), axis=0),\
           tf.concat((times, [[map_enter, map_elapsed]]), axis=0),\
           tf.concat((values, [values[-1]]), axis=0),\
           distorted_image,\
           label


for i in tf.data.Dataset.range(1).flat_map(dataset_generator_fun_train).map(map_fun_with_time).take(2):
    print(i)
    print("now time", time.perf_counter())
    print("-------------------------------------------------------------------------------")

(<tf.Tensor: shape=(3, 1), dtype=string, numpy=
array([[b'Open'],
       [b'Read'],
       [b'Map']], dtype=object)>, <tf.Tensor: shape=(3, 2), dtype=float32, numpy=
array([[4.9066819e+05, 2.9742192e-03],
       [4.9066819e+05, 2.3807518e-06],
       [4.9066838e+05, 4.5068976e-02]], dtype=float32)>, <tf.Tensor: shape=(3, 3), dtype=int32, numpy=
array([[ 1,  0, -1],
       [ 1,  0,  0],
       [ 1,  0,  0]], dtype=int32)>, <tf.Tensor: shape=(24, 24, 3), dtype=float32, numpy=
array([[[ 0.794585  ,  0.1525154 , -0.43435538],
        [ 0.794585  ,  0.20373973, -0.36603695],
        [ 0.48714247, -0.08662798, -0.6393299 ],
        ...,
        [ 0.94831586,  0.40871426, -0.1098188 ],
        [ 0.8458286 ,  0.2891522 , -0.21230607],
        [ 0.77751017,  0.27207744, -0.19521199]],

       [[ 0.40173   , -0.35992092, -1.1005033 ],
        [ 0.23092432, -0.49657702, -1.2029905 ],
        [ 0.06011866, -0.65028864, -1.3225526 ],
        ...,
        [ 0.35048637, -0.34284613, -1.0151101 ],
        [ 0.28216797, -0.42823932, -1.1005033 ],
        [ 0.33341157, -0.35992092, -0.98094124]],

       [[ 0.17968069, -0.53072655, -1.2200654 ],
        [ 0.16260591, -0.5136518 , -1.2029905 ],
        [ 0.16260591, -0.49657702, -1.1688217 ],
        ...,
        [ 0.26509318, -0.41116452, -1.1005033 ],
        [ 0.29924273, -0.41116452, -1.1005033 ],
        [ 0.11136229, -0.599045  , -1.23714   ]],

       ...,

       [[ 1.4607521 ,  0.989469  ,  0.5563291 ],
        [ 1.3582649 ,  0.818644  ,  0.30011094],
        [ 1.1703844 ,  0.4428831 , -0.2635497 ],
        ...,
        [ 0.45297363,  0.13542132, -1.2883837 ],
        [ 0.60670453,  0.13542132, -1.1859157 ],
        [ 1.3070213 ,  0.92115057, -0.53684264]],

       [[ 1.2387029 ,  0.47703266, -0.17813721],
        [ 1.204534  ,  0.47703266, -0.12689358],
        [ 1.477827  ,  0.7332508 ,  0.06098687],
        ...,
        [ 0.17968069,  0.23790859, -1.7837453 ],
        [ 0.77751017,  0.47703266, -1.2029905 ],
        [ 1.6486326 ,  1.2969115 , -0.21230607]],

       [[ 1.1362156 ,  0.22083381, -0.5710115 ],
        [ 1.1020467 ,  0.25498337, -0.46852422],
        [ 1.3070213 ,  0.56244516, -0.16106243],
        ...,
        [-0.00819975,  0.0841777 , -1.80082   ],
        [ 0.9653906 ,  0.69908196, -0.87845397],
        [ 1.4949018 ,  1.1261058 , -0.2635497 ]]], dtype=float32)>, <tf.Tensor: shape=(10,), dtype=float32, numpy=array([0., 0., 0., 0., 0., 0., 1., 0., 0., 0.], dtype=float32)>)
now time 490668.42789291
-------------------------------------------------------------------------------
(<tf.Tensor: shape=(3, 1), dtype=string, numpy=
array([[b'Open'],
       [b'Read'],
       [b'Map']], dtype=object)>, <tf.Tensor: shape=(3, 2), dtype=float32, numpy=
array([[-1.0000000e+00, -1.0000000e+00],
       [ 4.9066844e+05,  2.3807518e-06],
       [ 4.9066847e+05,  1.1549212e-02]], dtype=float32)>, <tf.Tensor: shape=(3, 3), dtype=int32, numpy=
array([[ 1,  0, -1],
       [ 1,  0,  1],
       [ 1,  0,  1]], dtype=int32)>, <tf.Tensor: shape=(24, 24, 3), dtype=float32, numpy=
array([[[ 0.47468224,  0.75477153,  0.97282755],
        [ 0.60898346,  0.90586287,  1.0399684 ],
        [-0.0289228 ,  0.1840257 ,  0.06633849],
        ...,
        [-1.1200638 , -1.1253278 , -1.3437556 ],
        [-0.83467126, -0.82316476, -1.142294  ],
        [-0.8850416 , -0.83995485, -1.3605261 ]],

       [[ 0.5082624 ,  0.72121096,  0.8049462 ],
        [ 0.5754032 ,  0.73800105,  0.73780537],
        [-0.16320443, -0.10134721, -0.25261462],
        ...,
        [-1.0025526 , -0.9910462 , -1.2765952 ],
        [-0.86825144, -0.83995485, -1.2094544 ],
        [-0.8011107 , -0.77281404, -1.2430346 ]],

       [[ 0.44110203,  0.6540505 ,  0.63708436],
        [ 0.5754032 ,  0.73800105,  0.67066455],
        [ 0.45789215,  0.5197689 ,  0.3852916 ],
        ...,
        [-1.0193232 , -0.9910462 , -1.3773162 ],
        [-0.9018317 , -0.8735351 , -1.2933853 ],
        [-1.0864836 , -1.058187  , -1.4780372 ]],

       ...,

       [[-1.3886466 , -1.461071  , -1.3101754 ],
        [-1.4893676 , -1.4946316 , -1.4612471 ],
        [-0.33108583, -0.11813731, -0.2694047 ],
        ...,
        [ 1.1629392 ,  0.8722827 , -0.05117261],
        [ 1.1293786 ,  0.82193196, -0.10152333],
        [ 1.146149  ,  0.7883518 , -0.16868371]],

       [[-1.3718565 , -1.4442809 , -1.2933853 ],
        [-1.3550664 , -1.37714   , -1.3773162 ],
        [-0.41501674, -0.28599912, -0.48761725],
        ...,
        [ 0.35717112,  0.1000948 , -0.58833826],
        [ 0.5082624 ,  0.2679566 , -0.45405665],
        [ 0.7600551 ,  0.45260853, -0.3701257 ]],

       [[-1.7915306 , -1.847165  , -1.74662   ],
        [-1.7915306 , -1.8303748 , -1.7802002 ],
        [-1.5732985 , -1.561792  , -1.5955483 ],
        ...,
        [-1.5229282 , -1.7967947 , -2.0823634 ],
        [-1.4725775 , -1.6793032 , -1.9648522 ],
        [-1.2543454 , -1.4946316 , -1.8809212 ]]], dtype=float32)>, <tf.Tensor: shape=(10,), dtype=float32, numpy=array([0., 0., 0., 0., 0., 0., 0., 0., 0., 1.], dtype=float32)>)
now time 490668.499416673
-------------------------------------------------------------------------------


steps_acc = tf.zeros([0, 1], dtype=tf.dtypes.string)
times_acc = tf.zeros([0, 2], dtype=tf.dtypes.float32)
values_acc = tf.zeros([0, 3], dtype=tf.dtypes.int32)

start_time = time.perf_counter()
print("start time: ", start_time)

for steps, times, values, image, label in tqdm(tf.data.Dataset.range(1).flat_map(dataset_generator_fun_train).map(map_fun_with_time).take(10)):    
    steps_acc = tf.concat((steps_acc, steps), axis=0)
    times_acc = tf.concat((times_acc, times), axis=0)
    values_acc = tf.concat((values_acc, values), axis=0)

    # simulate training time
    train_enter = time.perf_counter()
    time.sleep(0.1)
    train_elapsed = time.perf_counter() - train_enter
    
    steps_acc = tf.concat((steps_acc, [["Train"]]), axis=0)
    times_acc = tf.concat((times_acc, [(train_enter, train_elapsed)]), axis=0)
    values_acc = tf.concat((values_acc, [values[-1]]), axis=0)

tf.print("Execution time:", time.perf_counter() - start_time)
timeline = {"steps": steps_acc, "times": times_acc, "values": values_acc}

start time:  490668.527553598

10it [00:01,  5.19it/s]

Execution time: 1.975233745004516


from lab11_1_lib import draw_timeline

draw_timeline(timeline=timeline, title="test", min_width=1, annotate=True)


steps_acc = tf.zeros([0, 1], dtype=tf.dtypes.string)
times_acc = tf.zeros([0, 2], dtype=tf.dtypes.float32)
values_acc = tf.zeros([0, 3], dtype=tf.dtypes.int32)

start_time = time.perf_counter()
print("start time: ", start_time)

for steps, times, values, image, label in tqdm(tf.data.Dataset.range(1).flat_map(dataset_generator_fun_train).map(map_fun_with_time).batch(64).take(2)):
    '''
        steps: shape=(64, 3, 1)
        times: shape=(64, 3, 2)
        vaules: shape=(64, 3, 3)
        image: shape=(64, 24, 24, 3)
        label: shape=(64, 10)
    '''
    
    steps_acc = tf.concat([steps_acc, tf.reshape(steps, (steps.shape[0]*steps.shape[1], 1))], axis=0)
    times_acc = tf.concat([times_acc, tf.reshape(times, (times.shape[0]*times.shape[1], 2))], axis=0)
    values_acc = tf.concat([values_acc, tf.reshape(values, (values.shape[0]*values.shape[1], 3))], axis=0)

    train_enter = time.perf_counter()
    time.sleep(0.5) # simulate training time
    train_elapsed = time.perf_counter() - train_enter
    
    train_time = tf.concat([tf.fill([times.shape[0], 1], train_enter), tf.fill([times.shape[0], 1], train_elapsed)], axis=1) # shape=(times.shape[0], 2)
    
    steps_acc = tf.concat([steps_acc, tf.fill([steps.shape[0], 1], "Train")], axis=0)
    times_acc = tf.concat([times_acc, train_time], axis=0)
    values_acc = tf.concat([values_acc, values[:,-1,:]], axis=0)

tf.print("Execution time:", time.perf_counter() - start_time)
timeline = {"steps": steps_acc, "times": times_acc, "values": values_acc}

start time:  490670.882653565

2it [00:09,  4.73s/it]

Execution time: 9.501270917011425


draw_timeline(timeline=timeline, title="test_batch", min_width=1, annotate=True)


# re-construct a same model
model_cifar_op = models.Sequential()

model_cifar_op.add(layers.Conv2D(64, (5, 5), padding='same', activation='relu', input_shape=(24, 24, 3)))
model_cifar_op.add(layers.MaxPool2D(pool_size=3,strides=2,padding='same'))
model_cifar_op.add(layers.BatchNormalization())
                
model_cifar_op.add(layers.Conv2D(64, (5, 5), padding='same', activation='relu'))
model_cifar_op.add(layers.MaxPool2D(pool_size=3,strides=2,padding='same'))
model_cifar_op.add(layers.BatchNormalization())
                
model_cifar_op.add(layers.Flatten())
model_cifar_op.add(layers.Dense(384, activation='relu'))
model_cifar_op.add(layers.Dropout(0.5))
model_cifar_op.add(layers.Dense(192, activation='relu'))
model_cifar_op.add(layers.Dropout(0.5))
model_cifar_op.add(layers.Dense(10, activation='softmax'))
model_cifar_op.build()
model_cifar_op.summary()

Model: "sequential_4"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
=================================================================
 conv2d_7 (Conv2D)           (None, 24, 24, 64)        4864      
                                                                 
 max_pooling2d_6 (MaxPooling  (None, 12, 12, 64)       0         
 2D)                                                             
                                                                 
 batch_normalization_4 (Batc  (None, 12, 12, 64)       256       
 hNormalization)                                                 
                                                                 
 conv2d_8 (Conv2D)           (None, 12, 12, 64)        102464    
                                                                 
 max_pooling2d_7 (MaxPooling  (None, 6, 6, 64)         0         
 2D)                                                             
                                                                 
 batch_normalization_5 (Batc  (None, 6, 6, 64)         256       
 hNormalization)                                                 
                                                                 
 flatten_3 (Flatten)         (None, 2304)              0         
                                                                 
 dense_9 (Dense)             (None, 384)               885120    
                                                                 
 dropout_4 (Dropout)         (None, 384)               0         
                                                                 
 dense_10 (Dense)            (None, 192)               73920     
                                                                 
 dropout_5 (Dropout)         (None, 192)               0         
                                                                 
 dense_11 (Dense)            (None, 10)                1930      
                                                                 
=================================================================
Total params: 1,068,810
Trainable params: 1,068,554
Non-trainable params: 256
_________________________________________________________________


# save the initialization of weights 
model_cifar_op.save_weights('model_cifar_op.h5')


# define loss and optimizer
loss_object = tf.keras.losses.CategoricalCrossentropy(from_logits=True)
optimizer = tf.keras.optimizers.Adam()

train_loss = tf.keras.metrics.Mean(name='train_loss')
train_accuracy = tf.keras.metrics.SparseCategoricalAccuracy(name='train_accuracy')

test_loss = tf.keras.metrics.Mean(name='test_loss')
test_accuracy = tf.keras.metrics.SparseCategoricalAccuracy(name='test_accuracy')


@tf.function
def train_step(image, label):
    with tf.GradientTape() as tape:
        predictions = model_cifar_op(image, training=True)
        loss = loss_object(label, predictions)
    gradients = tape.gradient(loss, model_cifar_op.trainable_variables)
    optimizer.apply_gradients(zip(gradients, model_cifar_op.trainable_variables))

    train_loss(loss)
    train_accuracy(tf.argmax(label,axis=1), predictions)
    
@tf.function
def test_step(image, label):
    predictions = model_cifar_op(image, training=False)
    t_loss = loss_object(label, predictions)

    test_loss(t_loss)
    test_accuracy(tf.argmax(label,axis=1), predictions)


def timelined_benchmark(dataset_train, dataset_test, EPOCHS):
    steps_acc = tf.zeros([0, 1], dtype=tf.dtypes.string)
    times_acc = tf.zeros([0, 2], dtype=tf.dtypes.float32)
    values_acc = tf.zeros([0, 3], dtype=tf.dtypes.int32)

    start_time = time.perf_counter()
    print("start time: ", start_time)
    for epoch in range(EPOCHS):
        epoch_enter = time.perf_counter()

        # Reset the metrics at the start of the next epoch
        train_loss.reset_states()
        train_accuracy.reset_states()
        test_loss.reset_states()
        test_accuracy.reset_states()

        tf.print("training:")
        for steps, times, values, image, label in tqdm(dataset_train, total=math.floor(50000/BATCH_SIZE)):
            # sleep to avoid concurrency issue
            time.sleep(0.05)
            
            steps_acc = tf.concat([steps_acc, tf.reshape(steps, (steps.shape[0]*steps.shape[1], 1))], axis=0)
            times_acc = tf.concat([times_acc, tf.reshape(times, (times.shape[0]*times.shape[1], 2))], axis=0)
            values_acc = tf.concat([values_acc, tf.reshape(values, (values.shape[0]*values.shape[1], 3))], axis=0)

            # record training time
            train_enter = time.perf_counter()
            train_step(image, label)
            train_elapsed = time.perf_counter() - train_enter
            
            # sleep to avoid concurrency issue
            time.sleep(0.05)
            
            train_time = tf.concat([tf.fill([times.shape[0], 1], train_enter), tf.fill([times.shape[0], 1], train_elapsed)], axis=1) # shape=(times.shape[0], 2)
            steps_acc = tf.concat([steps_acc, tf.fill([steps.shape[0], 1], "Train")], axis=0)
            times_acc = tf.concat([times_acc, train_time], axis=0)
            values_acc = tf.concat([values_acc, values[:,-1,:]], axis=0)

        tf.print("testing:")
        for steps, times, values, image, label in tqdm(dataset_test, total=math.floor(10000/BATCH_SIZE)):
            # sleep to avoid concurrency issue
            time.sleep(0.05)
            
            steps_acc = tf.concat([steps_acc, tf.reshape(steps, (steps.shape[0]*steps.shape[1], 1))], axis=0)
            times_acc = tf.concat([times_acc, tf.reshape(times, (times.shape[0]*times.shape[1], 2))], axis=0)
            values_acc = tf.concat([values_acc, tf.reshape(values, (values.shape[0]*values.shape[1], 3))], axis=0)

            test_enter = time.perf_counter()
            test_step(image, label)
            test_elapsed = time.perf_counter() - test_enter
            
            # sleep to avoid concurrency issue
            time.sleep(0.05)
            
            test_time = tf.concat([tf.fill([times.shape[0], 1], test_enter), tf.fill([times.shape[0], 1], test_elapsed)], axis=1) # shape=(times.shape[0], 2)
            steps_acc = tf.concat([steps_acc, tf.fill([steps.shape[0], 1], "Test")], axis=0)
            times_acc = tf.concat([times_acc, test_time], axis=0)
            values_acc = tf.concat([values_acc, values[:,-1,:]], axis=0)
            
        template = 'Epoch {:0}, Loss: {:.4f}, Accuracy: {:.4f}, test Loss: {:.4f}, test Accuracy: {:.4f}'
        tf.print (template.format(epoch+1,
                               train_loss.result(),
                               train_accuracy.result()*100,
                               test_loss.result(),
                               test_accuracy.result()*100))

        epoch_elapsed = time.perf_counter() - epoch_enter
        steps_acc = tf.concat([steps_acc, [["Epoch"]]], axis=0)
        times_acc = tf.concat([times_acc, [(epoch_enter, epoch_elapsed)]], axis=0)
        values_acc = tf.concat([values_acc, [[-1, epoch, -1]]], axis=0)

    tf.print("Execution time:", time.perf_counter() - start_time)
    return {"steps": steps_acc, "times": times_acc, "values": values_acc}


# feel free to modify these two Settings.
BUFFER_SIZE = 10000
BATCH_SIZE = 64

# Construct training Dataset with similar steps
dataset_train = tf.data.Dataset.range(1).flat_map(dataset_generator_fun_train)\
                                        .map(map_fun_with_time)\
                                        .shuffle(10000)\
                                        .batch(BATCH_SIZE, drop_remainder=True)
                                        
# Construct testing Dataset with similar steps
dataset_test = tf.data.Dataset.range(1).flat_map(dataset_generator_fun_test)\
                                       .map(map_fun_test_with_time)\
                                       .batch(BATCH_SIZE, drop_remainder=True)

timeline_Naive = timelined_benchmark(dataset_train, dataset_test, EPOCHS=2)

start time:  492394.487955699
training:

100%|█████████████████████████████████████████| 781/781 [58:23<00:00,  4.49s/it]

testing:

100%|█████████████████████████████████████████| 156/156 [10:30<00:00,  4.04s/it]

Epoch 1, Loss: 1.7187, Accuracy: 37.2259, test Loss: 1.4126, test Accuracy: 49.8698
training:

100%|█████████████████████████████████████████| 781/781 [58:25<00:00,  4.49s/it]

testing:

100%|█████████████████████████████████████████| 156/156 [10:28<00:00,  4.03s/it]

Epoch 2, Loss: 1.4753, Accuracy: 47.3712, test Loss: 1.2083, test Accuracy: 57.8125
Execution time: 8268.120533703011


draw_timeline(timeline=timeline_Naive, title="Naive", min_width=8500)


@map_decorator
def map_fun_with_time_batchwise(steps, times, values, image, label):
    # sleep to avoid concurrency issue
    time.sleep(0.05)
    
    map_enter = time.perf_counter()
    
    image = tf.reshape(image,[tf.shape(image)[0], IMAGE_DEPTH, IMAGE_HEIGHT, IMAGE_WIDTH])
    image = tf.divide(tf.cast(tf.transpose(image,[0, 2, 3, 1]),tf.float32),255.0)
    label = tf.one_hot(label, 10)
    distorted_image = tf.image.random_crop(image, [tf.shape(image)[0], IMAGE_SIZE_CROPPED,IMAGE_SIZE_CROPPED,IMAGE_DEPTH])
    distorted_image = tf.image.random_flip_left_right(distorted_image)
    distorted_image = tf.image.random_brightness(distorted_image, max_delta=63)
    distorted_image = tf.image.random_contrast(distorted_image, lower=0.2, upper=1.8)
    distorted_image = tf.image.per_image_standardization(distorted_image)
    
    map_elapsed = time.perf_counter() - map_enter

    return tf.concat((steps, tf.tile([[["Map"]]], [BATCH_SIZE, 1, 1])), axis=1),\
           tf.concat((times, tf.tile([[[map_enter, map_elapsed]]], [BATCH_SIZE, 1, 1])), axis=1),\
           tf.concat((values, tf.tile([[values[:][-1][0]]], [BATCH_SIZE, 1, 1])), axis=1),\
           distorted_image,\
           label

@map_decorator
def map_fun_test_with_time_batchwise(steps, times, values, image, label):
    # sleep to avoid concurrency issue
    time.sleep(0.05)
    
    map_enter = time.perf_counter()
    
    image = tf.reshape(image,[tf.shape(image)[0],IMAGE_DEPTH,IMAGE_HEIGHT,IMAGE_WIDTH])
    image = tf.divide(tf.cast(tf.transpose(image,[0, 2, 3, 1]),tf.float32),255.0)
    label = tf.one_hot(label,10)
    distorted_image = tf.image.resize(image, [IMAGE_SIZE_CROPPED,IMAGE_SIZE_CROPPED])
    distorted_image = tf.image.per_image_standardization(distorted_image)
    
    map_elapsed = time.perf_counter() - map_enter
    
    return tf.concat((steps, tf.tile([[["Map"]]], [BATCH_SIZE, 1, 1])), axis=1),\
           tf.concat((times, tf.tile([[[map_enter, map_elapsed]]], [BATCH_SIZE, 1, 1])), axis=1),\
           tf.concat((values, tf.tile([[values[:][-1][0]]], [BATCH_SIZE, 1, 1])), axis=1),\
           distorted_image,\
           label


dataset_train_optimized = tf.data.Dataset.range(1).interleave(dataset_generator_fun_train, num_parallel_calls=tf.data.AUTOTUNE)\
                                                  .shuffle(BUFFER_SIZE)\
                                                  .batch(BATCH_SIZE, drop_remainder=True)\
                                                  .map(map_fun_with_time_batchwise, num_parallel_calls=tf.data.AUTOTUNE)\
                                                  .cache()\
                                                  .prefetch(tf.data.AUTOTUNE)
dataset_test_optimized = tf.data.Dataset.range(1).interleave(dataset_generator_fun_test, num_parallel_calls=tf.data.AUTOTUNE)\
                                                 .batch(BATCH_SIZE, drop_remainder=True)\
                                                 .map(map_fun_test_with_time_batchwise, num_parallel_calls=tf.data.AUTOTUNE)\
                                                 .cache()\
                                                 .prefetch(tf.data.AUTOTUNE)

# load the same initialization of weights and re-train with optimized input pipeline
model_cifar_op.load_weights('model_cifar_op.h5')
timeline_Optimized = timelined_benchmark(dataset_train_optimized, dataset_test_optimized, EPOCHS=2)

start time:  505283.709143188
training:

100%|█████████████████████████████████████████| 781/781 [02:03<00:00,  6.34it/s]

testing:

100%|█████████████████████████████████████████| 156/156 [00:22<00:00,  6.95it/s]

Epoch 1, Loss: 1.9210, Accuracy: 30.6198, test Loss: 1.5673, test Accuracy: 42.1174
training:

100%|█████████████████████████████████████████| 781/781 [01:36<00:00,  8.10it/s]

testing:

100%|█████████████████████████████████████████| 156/156 [00:19<00:00,  8.11it/s]

Epoch 2, Loss: 1.5617, Accuracy: 43.8200, test Loss: 1.2972, test Accuracy: 55.3185
Execution time: 261.2892151809647


draw_timeline(timeline_Optimized, "Optimized", min_width=8500)


draw_timeline(timeline_Optimized, "Optimized", min_width=1)


# if files have been opened and read into memory
dataset_train_example = tf.data.Dataset.from_tensor_slices((image, label))\
                                       .shuffle(BUFFER_SIZE)\
                                       .batch(BATCH_SIZE, drop_remainder=True)\
                                       .map(map_fun_batchwise, num_parallel_calls=tf.data.AUTOTUNE)\
                                       .cache()\
                                       .prefetch(tf.data.AUTOTUNE)

# or giving file path with `ImageDataGenerator()`, e.g.
flowers_file_path = tf.keras.utils.get_file('flower_photos', 'https://storage.googleapis.com/download.tensorflow.org/example_image/flower_photos.tgz', untar=True)
img_gen = tf.keras.preprocessing.image.ImageDataGenerator(rescale=1./255, rotation_range=20)
dataset_train_example = tf.data.Dataset.from_generator(
                            lambda: img_gen.flow_from_directory(flowers_file_path),
                            output_types=(tf.float32, tf.float32),
                            output_shapes=([32,256,256,3], [32,5])
                        )
dataset_train_example = dataset_train_example.shuffle(BUFFER_SIZE)\
                                             .batch(BATCH_SIZE, drop_remainder=True)\
                                             .map(map_fun_batchwise, num_parallel_calls=tf.data.AUTOTUNE)\
                                             .cache()\
                                             .prefetch(tf.data.AUTOTUNE)

# or tf.data.Dataset.list_files()
dataset_train_example = tf.data.Dataset.list_files(flowers_file_path+"/*/*.jpg")\
                                       .shuffle(BUFFER_SIZE)\
                                       .batch(BATCH_SIZE, drop_remainder=True)\
                                       .map(map_fun_batchwise, num_parallel_calls=tf.data.AUTOTUNE)\
                                       .cache()\
                                       .prefetch(tf.data.AUTOTUNE)


import os
import warnings
warnings.filterwarnings("ignore")
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2' 

import tensorflow as tf
from tensorflow.keras import utils, datasets, layers, models
from tensorflow.keras.applications.vgg16 import VGG16
from sklearn.utils import shuffle
from sklearn.model_selection import train_test_split
import IPython.display as display
import matplotlib.pyplot as plt
import pathlib
import random
import numpy as np
import matplotlib as mpl
import time

import csv
import pandas as pd
import math
from tqdm import tqdm

import itertools
from collections import defaultdict


# You need to download the prepared data and unzip the file in current path('./')
data_root = pathlib.Path('./oregon_wildlife')

# print the subfolders.
print('classes:')
for item in data_root.iterdir():
    print(item)
    
all_image_paths = list(data_root.glob('*/*'))
all_image_paths = [str(path) for path in all_image_paths]
all_image_paths = shuffle(all_image_paths, random_state=1)
all_image_paths = [path for path in all_image_paths if path[-3:] not in ('gif','bmp')]
image_count = len(all_image_paths)
print('\ntotal img num:', image_count)

classes:
oregon_wildlife/bald_eagle
oregon_wildlife/black_bear
oregon_wildlife/cougar
oregon_wildlife/deer
oregon_wildlife/nutria
oregon_wildlife/raccoon
oregon_wildlife/raven
oregon_wildlife/red_fox
oregon_wildlife/sea_lions
oregon_wildlife/virginia_opossum

total img num: 7168


# random showing 3 iamges for you
for n in range(3):
    image_path = random.choice(all_image_paths)
    display.display(display.Image(image_path, width=200, height=200))
    print(image_path.split('/')[-2])

raven

nutria

raven


# get the label
label_names = sorted(item.name for item in data_root.glob('*/') if item.is_dir())
# total label
n_classes = len(label_names)
print(label_names)

['bald_eagle', 'black_bear', 'cougar', 'deer', 'nutria', 'raccoon', 'raven', 'red_fox', 'sea_lions', 'virginia_opossum']


# get the mapping dict
label_to_index = dict((name, index) for index,name in enumerate(label_names))
index_to_label = dict((index, name) for index,name in enumerate(label_names))
print(label_to_index)

{'bald_eagle': 0, 'black_bear': 1, 'cougar': 2, 'deer': 3, 'nutria': 4, 'raccoon': 5, 'raven': 6, 'red_fox': 7, 'sea_lions': 8, 'virginia_opossum': 9}


# get the label data
all_image_label = [label_to_index[pathlib.Path(path).parent.name] for path in all_image_paths]
print("First 10 label indices: ", all_image_label[:10])

First 10 label indices:  [8, 5, 2, 5, 0, 2, 1, 0, 1, 0]


# Create training and testing sets using an 80-20 split
img_path_train, img_path_test, label_train, label_test = train_test_split(all_image_paths,
                                all_image_label,test_size=0.2,random_state=0)
print('training data: %d'%(len(img_path_train)))
print('testing data: %d'%(len(img_path_test)))

training data: 5734
testing data: 1434


# save (img_path, label) pairs
with open('train.csv', 'w', newline='') as csvfile:
    writer = csv.writer(csvfile)
    writer.writerow(['img_path', 'label'])
    for img_path, label in zip(img_path_train, label_train):
        writer.writerow([img_path, label])
        
with open('test.csv', 'w', newline='') as csvfile:
    writer = csv.writer(csvfile)
    writer.writerow(['img_path', 'label'])
    for img_path, label in zip(img_path_test, label_test):
        writer.writerow([img_path, label])


# Feel free to change IMAGE_SIZE_CROPPED if using random_crop in your data augmentation process, but make sure the input resize back to (300,300,3) before feed into VGG16
IMAGE_SIZE_CROPPED = 224
IMAGE_HEIGHT = 300
IMAGE_WIDTH = 300
IMAGE_DEPTH = 3


# construct a new dataset with time informantion
class TimeMeasuredDataset(tf.data.Dataset):
    # OUTPUT: (steps, timings, counters, img, label)
    OUTPUT_SIGNATURE=(
        tf.TensorSpec(shape=(2, 1), dtype=tf.string), # steps: [("Open",), ("Read",)]
        tf.TensorSpec(shape=(2, 2), dtype=tf.float32), # timings: [(open_enter, open_elapsed), (read_enter, read_elapsed)]
        tf.TensorSpec(shape=(2, 3), dtype=tf.int32), # counters: [(instance_idx, epoch_idx, -1), (instance_idx, epoch_idx, example_idx)]
        tf.TensorSpec(shape=(300,300,3), dtype=tf.float32),
        tf.TensorSpec(shape=(), dtype=tf.int32) # label
    )

    _INSTANCES_COUNTER = itertools.count()  # Number of datasets generated
    _EPOCHS_COUNTER = defaultdict(itertools.count)  # Number of epochs done for each dataset

    def _generator(instance_idx, filename, open_file, read_file):
        epoch_idx = next(TimeMeasuredDataset._EPOCHS_COUNTER[instance_idx])

        # Opening the file
        open_enter = time.perf_counter()
        img_paths, label = open_file(filename)
        open_elapsed = time.perf_counter() - open_enter
        # ----------------
        
        # Reading the file        
        for sample_idx in range(len(img_paths)):
            # Reading data (line, record) from the file
            read_enter = time.perf_counter()
            img = read_file(img_paths[sample_idx])
            read_elapsed = time.perf_counter() - read_enter

            yield (
                [("Open",), ("Read",)],
                [(open_enter, open_elapsed), (read_enter, read_elapsed)],
                [(instance_idx, epoch_idx, -1), (instance_idx, epoch_idx, sample_idx)],
                img,
                label[sample_idx]
            )
            open_enter, open_elapsed = -1., -1.  # Negative values will be filtered


    def __new__(cls, filename, open_file, read_file):
        def generator_func(instance_idx, filename):
            return cls._generator(instance_idx, filename, open_file, read_file)

        return tf.data.Dataset.from_generator(
            generator_func,
            output_signature=cls.OUTPUT_SIGNATURE,
            args=(next(cls._INSTANCES_COUNTER), filename)
        )


def open_file(filename):
    rows = pd.read_csv(filename.decode("utf-8"))
    img_paths = rows['img_path'].tolist()
    label = rows['label'].tolist()
    return img_paths, label

def read_file(image_path):
    img = tf.io.read_file(image_path)
    img = tf.image.decode_jpeg(img, channels=IMAGE_DEPTH)
    img = tf.image.resize(img, (IMAGE_HEIGHT, IMAGE_WIDTH))
    img = tf.cast(img, tf.float32)
    img = tf.divide(img,255.0)
    return img

def dataset_generator_fun_train(*args):
    return TimeMeasuredDataset('train.csv', open_file, read_file)

def dataset_generator_fun_test(*args):
    return TimeMeasuredDataset('test.csv', open_file, read_file)


# feel free to modify these two Settings.
BUFFER_SIZE = 10000
BATCH_SIZE = 1

dataset_train = tf.data.Dataset.range(1).flat_map(dataset_generator_fun_train).batch(BATCH_SIZE, drop_remainder=True)
dataset_test = tf.data.Dataset.range(1).flat_map(dataset_generator_fun_test).batch(BATCH_SIZE, drop_remainder=True)


for steps, timings, counters, img, label in dataset_train.take(1):
    print(steps[0], timings[0], counters[0])
    print(img[0].shape)
    plt.imshow(img[0]) 
    plt.axis('off') 
    plt.show()
    print(index_to_label[label[0].numpy()])

tf.Tensor(
[[b'Open']
 [b'Read']], shape=(2, 1), dtype=string) tf.Tensor(
[[5.0564150e+05 1.3395692e-02]
 [5.0564150e+05 3.0839540e-02]], shape=(2, 2), dtype=float32) tf.Tensor(
[[ 0  0 -1]
 [ 0  0  0]], shape=(2, 3), dtype=int32)
(300, 300, 3)

bald_eagle


base_model = VGG16(
    include_top=False,
    weights='imagenet',
    input_shape=(300, 300, 3),
    pooling=None,
)
for layer in base_model.layers:
    layer.trainable = False

top_model = models.Sequential()
top_model.add(layers.Flatten())
top_model.add(layers.Dense(4096, activation='relu'))
top_model.add(layers.Dropout(0.5))
top_model.add(layers.Dense(1024, activation='relu'))
top_model.add(layers.Dropout(0.5))
top_model.add(layers.Dense(n_classes, activation='softmax'))

wild_model = tf.keras.Model(inputs=base_model.input, outputs=top_model(base_model.output))


wild_model.summary()

Model: "model"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
=================================================================
 input_1 (InputLayer)        [(None, 300, 300, 3)]     0         
                                                                 
 block1_conv1 (Conv2D)       (None, 300, 300, 64)      1792      
                                                                 
 block1_conv2 (Conv2D)       (None, 300, 300, 64)      36928     
                                                                 
 block1_pool (MaxPooling2D)  (None, 150, 150, 64)      0         
                                                                 
 block2_conv1 (Conv2D)       (None, 150, 150, 128)     73856     
                                                                 
 block2_conv2 (Conv2D)       (None, 150, 150, 128)     147584    
                                                                 
 block2_pool (MaxPooling2D)  (None, 75, 75, 128)       0         
                                                                 
 block3_conv1 (Conv2D)       (None, 75, 75, 256)       295168    
                                                                 
 block3_conv2 (Conv2D)       (None, 75, 75, 256)       590080    
                                                                 
 block3_conv3 (Conv2D)       (None, 75, 75, 256)       590080    
                                                                 
 block3_pool (MaxPooling2D)  (None, 37, 37, 256)       0         
                                                                 
 block4_conv1 (Conv2D)       (None, 37, 37, 512)       1180160   
                                                                 
 block4_conv2 (Conv2D)       (None, 37, 37, 512)       2359808   
                                                                 
 block4_conv3 (Conv2D)       (None, 37, 37, 512)       2359808   
                                                                 
 block4_pool (MaxPooling2D)  (None, 18, 18, 512)       0         
                                                                 
 block5_conv1 (Conv2D)       (None, 18, 18, 512)       2359808   
                                                                 
 block5_conv2 (Conv2D)       (None, 18, 18, 512)       2359808   
                                                                 
 block5_conv3 (Conv2D)       (None, 18, 18, 512)       2359808   
                                                                 
 block5_pool (MaxPooling2D)  (None, 9, 9, 512)         0         
                                                                 
 sequential_5 (Sequential)   (None, 10)                174078986 
                                                                 
=================================================================
Total params: 188,793,674
Trainable params: 174,078,986
Non-trainable params: 14,714,688
_________________________________________________________________


# save the initialization of weights 
wild_model.save_weights('wild_model.h5')


loss_object = tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True)
optimizer = tf.keras.optimizers.Adam()

train_loss = tf.keras.metrics.Mean(name='train_loss')
train_accuracy = tf.keras.metrics.SparseCategoricalAccuracy(name='train_accuracy')

test_loss = tf.keras.metrics.Mean(name='test_loss')
test_accuracy = tf.keras.metrics.SparseCategoricalAccuracy(name='test_accuracy')


@tf.function
def train_step(image, label):
    with tf.GradientTape() as tape:
        predictions = wild_model(image, training=True)
        loss = loss_object(label, predictions)
    gradients = tape.gradient(loss, wild_model.trainable_variables)
    optimizer.apply_gradients(zip(gradients, wild_model.trainable_variables))

    train_loss(loss)
    train_accuracy(label, predictions)
    
@tf.function
def test_step(image, label):
    predictions = wild_model(image, training=False)
    loss = loss_object(label, predictions)

    test_loss(loss)
    test_accuracy(label, predictions)


def timelined_benchmark(dataset_train, dataset_test, EPOCHS):
    steps_acc = tf.zeros([0, 1], dtype=tf.dtypes.string)
    times_acc = tf.zeros([0, 2], dtype=tf.dtypes.float32)
    values_acc = tf.zeros([0, 3], dtype=tf.dtypes.int32)

    start_time = time.perf_counter()
    print("start time: ", start_time)
    for epoch in range(EPOCHS):
        epoch_enter = time.perf_counter()

        # Reset the metrics at the start of the next epoch
        train_loss.reset_states()
        train_accuracy.reset_states()
        test_loss.reset_states()
        test_accuracy.reset_states()

        tf.print("training:")
        for steps, times, values, image, label in tqdm(dataset_train, total=math.floor(len(img_path_train)/BATCH_SIZE)):
            time.sleep(0.05)
            
            steps_acc = tf.concat([steps_acc, tf.reshape(steps, (steps.shape[0]*steps.shape[1], 1))], axis=0)
            times_acc = tf.concat([times_acc, tf.reshape(times, (times.shape[0]*times.shape[1], 2))], axis=0)
            values_acc = tf.concat([values_acc, tf.reshape(values, (values.shape[0]*values.shape[1], 3))], axis=0)

            # record training time
            train_enter = time.perf_counter()
            train_step(image, label)
            train_elapsed = time.perf_counter() - train_enter
            
            time.sleep(0.05)
            
            train_time = tf.concat([tf.fill([times.shape[0], 1], train_enter), tf.fill([times.shape[0], 1], train_elapsed)], axis=1) # shape=(times.shape[0], 2)
            steps_acc = tf.concat([steps_acc, tf.fill([steps.shape[0], 1], "Train")], axis=0)
            times_acc = tf.concat([times_acc, train_time], axis=0)
            values_acc = tf.concat([values_acc, values[:,-1,:]], axis=0)

        tf.print("testing:")
        for steps, times, values, image, label in tqdm(dataset_test, total=math.floor(len(img_path_test)/BATCH_SIZE)):
            time.sleep(0.05)
            
            steps_acc = tf.concat([steps_acc, tf.reshape(steps, (steps.shape[0]*steps.shape[1], 1))], axis=0)
            times_acc = tf.concat([times_acc, tf.reshape(times, (times.shape[0]*times.shape[1], 2))], axis=0)
            values_acc = tf.concat([values_acc, tf.reshape(values, (values.shape[0]*values.shape[1], 3))], axis=0)

            test_enter = time.perf_counter()
            test_step(image, label)
            test_elapsed = time.perf_counter() - test_enter
            
            time.sleep(0.05)
            
            test_time = tf.concat([tf.fill([times.shape[0], 1], test_enter), tf.fill([times.shape[0], 1], test_elapsed)], axis=1) # shape=(times.shape[0], 2)
            steps_acc = tf.concat([steps_acc, tf.fill([steps.shape[0], 1], "Test")], axis=0)
            times_acc = tf.concat([times_acc, test_time], axis=0)
            values_acc = tf.concat([values_acc, values[:,-1,:]], axis=0)
            
        template = 'Epoch {:0}, Loss: {:.4f}, Accuracy: {:.4f}, test Loss: {:.4f}, test Accuracy: {:.4f}'
        tf.print (template.format(epoch+1,
                               train_loss.result(),
                               train_accuracy.result()*100,
                               test_loss.result(),
                               test_accuracy.result()*100))

        epoch_elapsed = time.perf_counter() - epoch_enter
        steps_acc = tf.concat([steps_acc, [["Epoch"]]], axis=0)
        times_acc = tf.concat([times_acc, [(epoch_enter, epoch_elapsed)]], axis=0)
        values_acc = tf.concat([values_acc, [[-1, epoch, -1]]], axis=0)

    tf.print("Execution time:", time.perf_counter() - start_time)
    return {"steps": steps_acc, "times": times_acc, "values": values_acc}


timeline_Naive = timelined_benchmark(dataset_train, dataset_test, EPOCHS=3)

start time:  505650.195122698
training:

100%|███████████████████████████████████████| 5734/5734 [13:09<00:00,  7.26it/s]

testing:

100%|███████████████████████████████████████| 1434/1434 [03:18<00:00,  7.21it/s]

Epoch 1, Loss: 4.5322, Accuracy: 10.4290, test Loss: 2.3034, test Accuracy: 10.0418
training:

100%|███████████████████████████████████████| 5734/5734 [13:16<00:00,  7.20it/s]

testing:

100%|███████████████████████████████████████| 1434/1434 [03:20<00:00,  7.15it/s]

Epoch 2, Loss: 3.0177, Accuracy: 10.3767, test Loss: 2.3295, test Accuracy: 10.0418
training:

100%|███████████████████████████████████████| 5734/5734 [13:22<00:00,  7.15it/s]


draw_timeline(timeline=timeline_Naive, title="Naive", min_width=3000)


## TODO: build `dataset_train_augmentation` and `dataset_test_augmentation` with transformation
## Remember to define your own map functions with map_decorator before calling map

# dataset_train_augmentation = tf.data.Dataset.range(1). ...
# dataset_test_augmentation = tf.data.Dataset.range(1). ...


# load the same initialization of weights and re-train with optimized input pipeline
wild_model.load_weights('wild_model.h5')
timeline_Augmentation = timelined_benchmark(dataset_train_augmentation, dataset_test_augmentation, EPOCHS=3)


draw_timeline(timeline=timeline_Augmentation, title="Augmentation", min_width=3000)


## TODO: build `dataset_train_optimized` and `dataset_test_optimized` with transformation and optimzation
## Remember to re-define your own map functions again to make mapping time re-calculated

# dataset_train_optimized = tf.data.Dataset.range(1). ...
# dataset_test_optimized = tf.data.Dataset.range(1). ...


# load the same initialization of weights and re-train with optimized input pipeline
wild_model.load_weights('wild_model.h5')
timeline_Optimized = timelined_benchmark(dataset_train_optimized, dataset_test_optimized, EPOCHS=3)


draw_timeline(timeline=timeline_Optimized, title="Optimized", min_width=3000)

Convolution Neural Networks¶

MNIST¶

Softmax Regression on MNIST¶

Multilayer Convolutional Network on MNIST¶

Create the convolutional base¶

Add Dense layers on top¶

Compile and train the model¶

Cifar-10¶

Feature Selection¶

K Nearest Neighbors (KNN) on CIFAR-10¶

Support Vector Machine (SVM) on CIFAR-10¶

CNN on CIFAR-10¶

Input Pipeline¶

Structure of an input pipeline¶

tf.data API¶

Construct your Dataset¶

Consume elements¶

Apply transformations¶

map¶

shuffle¶

batch¶

repeat¶

prefetch¶

repeat+batch / batch+repeat¶

shufflt+repeat / repeat+shufflt¶

CNN Model for CIFAR 10¶

Loading Data Manually¶

Optimization for input pipeline¶

Dataset with time¶

Map function with time¶

Re-train CNN with time¶

optimization dataset pipeline¶

Note that since we are vectorizing map function, there's one more dimension for batch in each inputs when mapping. Therefore, we have to modify map function first:¶

in practical use (a simple demo)¶

Assignment¶

Description of Dataset:¶

Requirement:¶

Note:¶

Notification:¶