July 2023 Deep Learning Project¶
Moving MNIST: a sequence prediction task¶
In this notebook, I'll experiment with Convolutional LSTMs to solve the Moving MNIST problem from the July 2023 Deep Learning exam. The code is commented where necessary ("import numpy" probably doesn't need much explanation), and Markdown cells add background on the research done for this notebook.
# All necessary imports
import tensorflow as tf
from tensorflow import keras
from keras import layers
import tensorflow_datasets as tfds
import math
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
# Downloading the dataset...
ds = tfds.as_numpy(tfds.load(
    'moving_mnist',
    split='test',
    batch_size=-1
))
sequences = ds['image_sequence']
# ...and fixing its dimensions while also normalizing, as was done in the example notebook.
sequences = np.squeeze(np.swapaxes(sequences, 1, 4), axis=1) / 255.
print(sequences.shape)
print(np.min(sequences), np.max(sequences))
(10000, 64, 64, 20) 0.0 1.0
The dataset has 10k sequences of 64x64 videos, each 20 frames long, now normalized to the 0-1 range, which is optimal for ML. Let's split the dataset into a training set with 80% of the sequences, a validation set with 10%, and a test set with the remaining 10%. Then we'll cut every sequence into groups of 3+1 frames (3 inputs, 1 target), so that every frame is used exactly once.
(In theory, even more 4-frame splits could be made, for example by taking the last 2 frames of one group and the first 2 of the next, but since I'm working with a local GPU I already have trouble handling the resulting 40k samples.)
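For reference, such a stride-1 sliding window over each video could look like the sketch below. (sliding_window_split is a hypothetical helper of my own, not used in this notebook precisely because of those memory limits; it expects arrays with the time axis in position 1, like the trainset built in the next cell.)
def sliding_window_split(videos, window=3):
    # videos: shape (N, 20, 64, 64, 1); each start index yields one window
    # of 3 input frames plus the single frame that follows as the target
    xs, ys = [], []
    for start in range(videos.shape[1] - window):
        xs.append(videos[:, start:start + window])
        ys.append(videos[:, start + window:start + window + 1])
    return np.concatenate(xs, axis=0), np.concatenate(ys, axis=0)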
# Reordering the axes for easy access during training
trainset = np.expand_dims(sequences[:8000].transpose(0,3,1,2), axis=4)
valset = np.expand_dims(sequences[8000:9000].transpose(0,3,1,2), axis=4)
testset = np.expand_dims(sequences[9000:10000].transpose(0,3,1,2), axis=4)
print(trainset.shape)
(8000, 20, 64, 64, 1)
# Precisely splitting the dataset so as to have 40000 series of 3 images + 40000 target frames...
x_train = np.concatenate([trainset[:,:3,:,:,:], trainset[:,4:7,:,:,:], trainset[:,8:11,:,:,:], trainset[:,12:15,:,:,:], trainset[:,16:19,:,:,:]], axis=0)
y_train = np.concatenate([trainset[:,3:4,:,:,:], trainset[:,7:8,:,:,:], trainset[:,11:12,:,:,:], trainset[:,15:16,:,:,:], trainset[:,19:20,:,:,:]], axis=0)
print(x_train.shape, y_train.shape)
x_val = np.concatenate([valset[:,:3,:,:,:], valset[:,4:7,:,:,:], valset[:,8:11,:,:,:], valset[:,12:15,:,:,:], valset[:,16:19,:,:,:]], axis=0)
y_val = np.concatenate([valset[:,3:4,:,:,:], valset[:,7:8,:,:,:], valset[:,11:12,:,:,:], valset[:,15:16,:,:,:], valset[:,19:20,:,:,:]], axis=0)
x_test = np.concatenate([testset[:,:3,:,:,:], testset[:,4:7,:,:,:], testset[:,8:11,:,:,:], testset[:,12:15,:,:,:], testset[:,16:19,:,:,:]], axis=0)
y_test = np.concatenate([testset[:,3:4,:,:,:], testset[:,7:8,:,:,:], testset[:,11:12,:,:,:], testset[:,15:16,:,:,:], testset[:,19:20,:,:,:]], axis=0)
(40000, 3, 64, 64, 1) (40000, 1, 64, 64, 1)
# ...and shuffling it among the 3 sets, using a numpy permutation in order to preserve the x-y correlation
ind_1 = np.random.permutation(x_train.shape[0])
ind_2 = np.random.permutation(x_val.shape[0])
ind_3 = np.random.permutation(x_test.shape[0])
DATASET_SIZE = 40000 # This can be used to reduce the dataset size, useful for example during model selection
x_train = x_train[ind_1][:DATASET_SIZE]
y_train = y_train[ind_1][:DATASET_SIZE]
x_val = x_val[ind_2][:DATASET_SIZE // 8]
y_val = y_val[ind_2][:DATASET_SIZE // 8]
x_test = x_test[ind_3][:DATASET_SIZE // 8]
y_test = y_test[ind_3][:DATASET_SIZE // 8]
print(x_train.shape, y_train.shape)
(40000, 3, 64, 64, 1) (40000, 1, 64, 64, 1)
As reported in "Video (language) modeling: a baseline for generative models of natural videos" (Ranzato et al., 2014), simply applying MSE as the loss to a generic model will not work: any model can produce relatively low reconstruction errors by merely blurring the last frame (or, in this case, by outputting a blank picture), and no real learning will occur. Below is an example of such deceptive "92% accuracy".
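To see how such a figure can arise, here is a quick sanity check (my own sketch, not part of the original experiments) scoring an all-black "prediction" against a slice of the training targets:
# An all-black frame already achieves a low MSE and a high per-pixel "accuracy",
# simply because most of every Moving MNIST frame is background
sample = y_train[:1000]
blank = np.zeros_like(sample)
print("Blank-frame MSE:", np.mean((sample - blank) ** 2))
print("Blank-frame per-pixel accuracy:", np.mean((sample > 0.5) == (blank > 0.5)))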
In fact, the task needs a dedicated model: the following approach is based on the Convolutional LSTM architecture, which brings together time-series analysis and computer vision ("Convolutional LSTM Network: A Machine Learning Approach for Precipitation Nowcasting", Xingjian Shi et al., 2015).
The model is made of 3 ConvLSTMs with diminishing kernel sizes, ending in a Conv3D layer used to obtain a spatiotemporal output (the third dimension is time), as suggested in "Learning Spatiotemporal Features with 3D Convolutional Networks", Du Tran et al., 2014.
I ran a grid search for model selection (sadly on a reduced training set, due to my available computational power) over the kernel sizes, the number of filters in the ConvLSTMs, and the learning rate of the optimizer.
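As a reference, the search loop looked roughly like the sketch below (build_model and the exact candidate grids are my reconstruction, not the verbatim code I ran):
def build_model(kernels, filters, lr):
    # Same architecture as the final model below, parameterized for the search
    m = keras.models.Sequential()
    m.add(layers.Input(shape=(None, 64, 64, 1)))
    for i, k in enumerate(kernels):
        m.add(layers.ConvLSTM2D(filters=filters, kernel_size=(k, k),
                                padding="same", return_sequences=True, activation="relu"))
        if i < len(kernels) - 1:
            m.add(layers.BatchNormalization())
    m.add(layers.Conv3D(filters=1, kernel_size=(4, 4, 4), activation="sigmoid", padding="same"))
    m.compile(loss='mean_squared_error', optimizer=keras.optimizers.Adam(learning_rate=lr))
    return m

results = []
for kernels in [(9, 5, 1), (7, 5, 3), (5, 3, 1)]:  # candidate kernel ladders
    for filters in [32, 64, 128]:                  # candidate filter counts
        for lr in [1e-2, 1e-3, 1e-4]:              # candidate learning rates
            m = build_model(kernels, filters, lr)
            h = m.fit(x_train[:2000], y_train[:2000], batch_size=10, epochs=3,
                      validation_data=(x_val[:250], y_val[:250]), verbose=0)
            results.append((kernels, filters, lr, h.history['val_loss'][-1]))
results.sort(key=lambda r: r[-1])  # best configurations first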
Based on the three best configurations found during model selection, the final model has 3 ConvLSTMs with kernels of size 9x9, 5x5 and 1x1 and uses 128 filters per layer. At this point, I ran a complete training of this model for 10 epochs on the full dataset.
EPOCHS = 5 # Number of training epochs; I actually did 10 in total, running the code twice and resuming from checkpoints
model = keras.models.Sequential() # Model defined as explained above
model.add(layers.Input(shape=(None, 64, 64, 1)))
model.add(layers.ConvLSTM2D(filters=128, kernel_size=(9, 9),
                            padding="same", return_sequences=True, activation="relu"))
model.add(layers.BatchNormalization())
model.add(layers.ConvLSTM2D(filters=128, kernel_size=(5, 5),
                            padding="same", return_sequences=True, activation="relu"))
model.add(layers.BatchNormalization())
model.add(layers.ConvLSTM2D(filters=128, kernel_size=(1, 1),
                            padding="same", return_sequences=True, activation="relu"))
model.add(layers.Conv3D(filters=1, kernel_size=(4, 4, 4), activation="sigmoid", padding="same"))
model.compile(loss='mean_squared_error', optimizer=keras.optimizers.Adam(learning_rate=0.001))
checkpoint_filepath = 'tmp/checkpoint_3D_3' # Path for the 2nd checkpoint
model_checkpoint_callback = tf.keras.callbacks.ModelCheckpoint(
    filepath=checkpoint_filepath,
    save_weights_only=True,
    monitor='val_loss',
    mode='min',
    save_best_only=True)
model.load_weights('tmp/checkpoint_3D_2') # <--- Used to resume from the previous checkpoint
history = model.fit(x_train, y_train, batch_size=10, epochs=EPOCHS, validation_data=(x_val, y_val),
                    callbacks=[model_checkpoint_callback])
Epoch 1/5
4000/4000 [==============================] - 4322s 1s/step - loss: 0.0094 - val_loss: 0.0099
Epoch 2/5
4000/4000 [==============================] - 4328s 1s/step - loss: 0.0091 - val_loss: 0.0100
Epoch 3/5
4000/4000 [==============================] - 4308s 1s/step - loss: 0.0089 - val_loss: 0.0099
Epoch 4/5
4000/4000 [==============================] - 4297s 1s/step - loss: 0.0087 - val_loss: 0.0099
Epoch 5/5
4000/4000 [==============================] - 4380s 1s/step - loss: 0.0085 - val_loss: 0.0099
The weights after 5 epochs, after 10 epochs and at the best epoch have all been saved to disk and can be made available on request.
Now, since the model still outputs a full 3-frame sequence, I visualized the output and chose which frame to actually use as the prediction.
x = model.predict(x_val[0:10]) # Predict on a small slice of the validation set
mse = tf.keras.losses.MeanSquaredError()
fig, ax = plt.subplots(2, 4, figsize=(16, 10))
for i in range(2):
    ax[i][0].imshow(y_val[i, 0, :, :, :])
    ax[i][0].set_title('Target')
    for j in range(3):
        ax[i][j+1].imshow(x[i, j, :, :, :])
        ax[i][j+1].set_title('Image ' + str(j+1))
1/1 [==============================] - 0s 36ms/step
Since the three output images are almost identical, I decided to compute the average MSE of each against the target over the whole validation set and use the lowest-scoring frame as the actual prediction.
model.load_weights('tmp/checkpoint_3D_3') # <--- Load weights of the best model in training w.r.t. val_loss
y_pred = model.predict(x_val)
157/157 [==============================] - 353s 2s/step
MSE_1 = mse(y_val[:, 0, :, :, :], y_pred[:, 0, :, :, :]).numpy()
MSE_2 = mse(y_val[:, 0, :, :, :], y_pred[:, 1, :, :, :]).numpy()
MSE_3 = mse(y_val[:, 0, :, :, :], y_pred[:, 2, :, :, :]).numpy()
print("Best MSE is", min(MSE_1, MSE_2, MSE_3), "of image n.", np.argmin([MSE_1, MSE_2, MSE_3]) + 1)
Best MSE is 0.009905176 of image n. 2
Lastly, I defined a function that selects this frame at prediction time, and ran a definitive test to see the final MSE on the test set:
def custom_predict(M, X):
    Y = M.predict(X)
    return Y[:, 1:2, :, :, :] # Very simply, run the standard prediction and return only the second image
y_test_pred = custom_predict(model, x_test)
MSE_test = mse(y_test, y_test_pred).numpy()
print("Final result is an MSE of", MSE_test) # Final score for this model!
157/157 [==============================] - 354s 2s/step
Final result is an MSE of 0.010013093
# A bit of visualization of the model's results
fig, ax = plt.subplots(4, 4, figsize=(16, 17))
fig.suptitle('4th image is prediction')
OFFSET = 100
for i in range(4):
    ax[i][0].imshow(x_test[i+OFFSET, 0, :, :, :])
    ax[i][1].imshow(x_test[i+OFFSET, 1, :, :, :])
    ax[i][2].imshow(x_test[i+OFFSET, 2, :, :, :])
    ax[i][3].imshow(y_test_pred[i+OFFSET, 0, :, :, :])
At this point, I could have called it a day and been content with an MSE of 0.01, but I tried a couple more things.
First, I tried to resume training with a custom loss function: still mean squared error, but applied only to the frame we selected as the actual prediction, hoping that this more targeted training could reach a score of 0.009X. It ended up not working, and actually only increased overfitting.
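For completeness, the frame-selective loss could look like this sketch (my reconstruction of the idea, not the verbatim code I ran):
# Plain MSE, but computed only against the second output frame,
# i.e. the frame that custom_predict later returns
def selected_frame_mse(y_true, y_pred):
    # y_true: (batch, 1, 64, 64, 1); y_pred: (batch, 3, 64, 64, 1)
    return tf.reduce_mean(tf.square(y_true[:, 0] - y_pred[:, 1]))

# model.compile(loss=selected_frame_mse, optimizer=keras.optimizers.Adam(learning_rate=0.001))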
Therefore, I tried to expand the training set instead: since I had only ever used fixed groups of frames, I re-built the training set (NOT the test set) with different groups, shifted by 2 frames. This gives more varied training data, at the expense of dataset size (reduced from 40,000 to 32,000, since the extremes of each sequence are discarded).
(Please note that only the training and validation sets are used in all training and selection procedures; the test set is used exclusively to compute the final MSE, to keep the result as honest as possible, since it is data "never before seen" by the algorithm.)
# Precisely splitting the dataset so as to have 32000 series of 3 images this time, + 32000 target frames...
x_train_2 = np.concatenate([trainset[:,2:5,:,:,:], trainset[:,6:9,:,:,:], trainset[:,10:13,:,:,:], trainset[:,14:17,:,:,:]], axis=0)
y_train_2 = np.concatenate([trainset[:,5:6,:,:,:], trainset[:,9:10,:,:,:], trainset[:,13:14,:,:,:], trainset[:,17:18,:,:,:]], axis=0)
print(x_train_2.shape, y_train_2.shape)
x_val_2 = np.concatenate([valset[:,2:5,:,:,:], valset[:,6:9,:,:,:], valset[:,10:13,:,:,:], valset[:,14:17,:,:,:]], axis=0)
y_val_2 = np.concatenate([valset[:,5:6,:,:,:], valset[:,9:10,:,:,:], valset[:,13:14,:,:,:], valset[:,17:18,:,:,:]], axis=0)
(32000, 3, 64, 64, 1) (32000, 1, 64, 64, 1)
# ...and shuffling the 2 new sets, using a numpy permutation in order to preserve the x-y correlation
ind_1 = np.random.permutation(x_train_2.shape[0])
ind_2 = np.random.permutation(x_val_2.shape[0])
# (No third permutation this time: the test set is NOT rebuilt.)
DATASET_SIZE = x_train_2.shape[0] # This can be used to reduce the dataset size, useful for example during model selection
x_train_2 = x_train_2[ind_1][:DATASET_SIZE]
y_train_2 = y_train_2[ind_1][:DATASET_SIZE]
x_val_2 = x_val_2[ind_2][:DATASET_SIZE // 8]
y_val_2 = y_val_2[ind_2][:DATASET_SIZE // 8]
print(x_train_2.shape, y_train_2.shape)
(32000, 3, 64, 64, 1) (32000, 1, 64, 64, 1)
EPOCHS = 5 # Number of training epochs; only 5 this time, since the model starts already partially trained
model_2 = keras.models.Sequential() # Model defined exactly as the previous one
model_2.add(layers.Input(shape=(None, 64, 64, 1)))
model_2.add(layers.ConvLSTM2D(filters=128, kernel_size=(9, 9),
                              padding="same", return_sequences=True, activation="relu"))
model_2.add(layers.BatchNormalization())
model_2.add(layers.ConvLSTM2D(filters=128, kernel_size=(5, 5),
                              padding="same", return_sequences=True, activation="relu"))
model_2.add(layers.BatchNormalization())
model_2.add(layers.ConvLSTM2D(filters=128, kernel_size=(1, 1),
                              padding="same", return_sequences=True, activation="relu"))
model_2.add(layers.Conv3D(filters=1, kernel_size=(4, 4, 4), activation="sigmoid", padding="same"))
model_2.compile(loss='mean_squared_error', optimizer=keras.optimizers.Adam(learning_rate=0.001))
checkpoint_filepath_2 = 'tmp/checkpoint_3D_custom' # Path for this model's checkpoint
model_checkpoint_callback_2 = tf.keras.callbacks.ModelCheckpoint(
    filepath=checkpoint_filepath_2,
    save_weights_only=True,
    monitor='val_loss',
    mode='min',
    save_best_only=True)
model_2.load_weights('tmp/checkpoint_3D_3') # <--- Resume from the previous model's best checkpoint
history = model_2.fit(x_train_2, y_train_2, batch_size=10, epochs=EPOCHS, validation_data=(x_val_2, y_val_2),
                      callbacks=[model_checkpoint_callback_2])
Epoch 1/5
3200/3200 [==============================] - 3497s 1s/step - loss: 0.0098 - val_loss: 0.0098
Epoch 2/5
3200/3200 [==============================] - 3514s 1s/step - loss: 0.0094 - val_loss: 0.0095
Epoch 3/5
3200/3200 [==============================] - 3545s 1s/step - loss: 0.0091 - val_loss: 0.0097
Epoch 4/5
3200/3200 [==============================] - 3486s 1s/step - loss: 0.0089 - val_loss: 0.0096
Epoch 5/5
3200/3200 [==============================] - 3482s 1s/step - loss: 0.0086 - val_loss: 0.0096
model_2.load_weights('tmp/checkpoint_3D_custom') # <--- Load weights of the best model in training w.r.t. val_loss
y_test_pred_2 = custom_predict(model_2, x_test)
MSE_test_2 = mse(y_test, y_test_pred_2).numpy()
print("Final result is an MSE of", MSE_test_2) # Final score for this model!
157/157 [==============================] - 226s 1s/step
Final result is an MSE of 0.009755889
# A bit of visualization of the model's results
fig, ax = plt.subplots(4, 4, figsize=(16, 17))
fig.suptitle('4th image is prediction')
OFFSET = 50
for i in range(4):
    ax[i][0].imshow(x_test[i+OFFSET, 0, :, :, :])
    ax[i][1].imshow(x_test[i+OFFSET, 1, :, :, :])
    ax[i][2].imshow(x_test[i+OFFSET, 2, :, :, :])
    ax[i][3].imshow(y_test_pred_2[i+OFFSET, 0, :, :, :])
And this was my best attempt: after breaking the "psychological wall" of 0.01, I think I can be satisfied with the result.
MSE = 0.00975¶
...but after some failed attempts at further pre-processing, I asked myself: "Why not POST-processing?"
In the following cells, I define a model that, through multiple convolutions, max pooling and batch normalization, takes the output of the previous model and tries to correct some minor mistakes, slightly improving the accuracy of the overall pipeline. Of course, as usual, only the training and validation sets are used throughout; the test set appears only at the very end, for the final evaluation.
X_post = custom_predict(model_2, x_train) # Create a dataset for the new model...
print(X_post.shape)
1250/1250 [==============================] - 1819s 1s/step
(40000, 1, 64, 64, 1)
X_val_post = custom_predict(model_2, x_val) # ...alongside a Validation set
print(X_val_post.shape)
157/157 [==============================] - 227s 1s/step
(5000, 1, 64, 64, 1)
X_post = np.reshape(X_post, (40000, 64, 64, 1)) # No more series, so the timesteps dimension is useless
y_post = np.reshape(y_train, (40000, 64, 64, 1))
X_val_post = np.reshape(X_val_post, (5000, 64, 64, 1))
y_val_post = np.reshape(y_val, (5000, 64, 64, 1))
model_post = keras.models.Sequential()
model_post.add(layers.Conv2D(64, (3, 3), input_shape=(64, 64, 1), activation='relu', padding='same'))
model_post.add(layers.MaxPooling2D(pool_size=(2, 2)))  # Downsample 64x64 -> 32x32
model_post.add(layers.Conv2D(128, (3, 3), activation='relu', padding='same'))
model_post.add(layers.BatchNormalization())
model_post.add(layers.Conv2D(128, (3, 3), activation='relu', padding='same'))
model_post.add(layers.UpSampling2D((2, 2)))  # Upsample back to 64x64
model_post.add(layers.Conv2D(1, (3, 3), activation='sigmoid', padding='same'))  # Single corrected frame in [0, 1]
checkpoint_filepath_post = 'tmp/checkpoint_post' # Path for the new model's checkpoint
model_checkpoint_callback_post = tf.keras.callbacks.ModelCheckpoint(
    filepath=checkpoint_filepath_post,
    save_weights_only=True,
    monitor='val_loss',
    mode='min',
    save_best_only=True)
model_post.compile(loss='mean_squared_error', optimizer='adam')
model_post.fit(X_post, y_post, batch_size=10, epochs=10, validation_data=(X_val_post, y_val_post),
               callbacks=[model_checkpoint_callback_post])
Epoch 1/10
4000/4000 [==============================] - 36s 9ms/step - loss: 0.0095 - val_loss: 0.0097
Epoch 2/10
4000/4000 [==============================] - 34s 8ms/step - loss: 0.0091 - val_loss: 0.0095
Epoch 3/10
4000/4000 [==============================] - 34s 8ms/step - loss: 0.0090 - val_loss: 0.0095
Epoch 4/10
4000/4000 [==============================] - 34s 9ms/step - loss: 0.0090 - val_loss: 0.0095
Epoch 5/10
4000/4000 [==============================] - 34s 9ms/step - loss: 0.0089 - val_loss: 0.0094
Epoch 6/10
4000/4000 [==============================] - 34s 9ms/step - loss: 0.0088 - val_loss: 0.0094
Epoch 7/10
4000/4000 [==============================] - 34s 9ms/step - loss: 0.0088 - val_loss: 0.0093
Epoch 8/10
4000/4000 [==============================] - 34s 9ms/step - loss: 0.0088 - val_loss: 0.0093
Epoch 9/10
4000/4000 [==============================] - 34s 9ms/step - loss: 0.0087 - val_loss: 0.0093
Epoch 10/10
4000/4000 [==============================] - 34s 9ms/step - loss: 0.0087 - val_loss: 0.0093
<keras.callbacks.History at 0x2303099d930>
Immediately after this training, I repeated exactly what I did with the main model and ran the whole training again on the "second" (shifted) dataset.
X_post_2 = custom_predict(model_2, x_train_2) # Dataset for the second part
X_val_post_2 = custom_predict(model_2, x_val_2)
1000/1000 [==============================] - 1433s 1s/step
125/125 [==============================] - 176s 1s/step
X_post_2 = np.reshape(X_post_2, (32000, 64, 64, 1)) # Reshaping again
y_post_2 = np.reshape(y_train_2, (32000, 64, 64, 1))
X_val_post_2 = np.reshape(X_val_post_2, (4000, 64, 64, 1))
y_val_post_2 = np.reshape(y_val_2, (4000, 64, 64, 1))
model_post.load_weights('tmp/checkpoint_post')
checkpoint_filepath_post_2 = 'tmp/checkpoint_post_2' # Path for the final checkpoint
model_checkpoint_callback_post_2 = tf.keras.callbacks.ModelCheckpoint(
    filepath=checkpoint_filepath_post_2,
    save_weights_only=True,
    monitor='val_loss',
    mode='min',
    save_best_only=True)
model_post.fit(X_post_2, y_post_2, batch_size=10, epochs=10, validation_data=(X_val_post_2, y_val_post_2),
               callbacks=[model_checkpoint_callback_post_2])
Epoch 1/10
3200/3200 [==============================] - 28s 9ms/step - loss: 0.0085 - val_loss: 0.0091
Epoch 2/10
3200/3200 [==============================] - 28s 9ms/step - loss: 0.0084 - val_loss: 0.0091
Epoch 3/10
3200/3200 [==============================] - 28s 9ms/step - loss: 0.0084 - val_loss: 0.0091
Epoch 4/10
3200/3200 [==============================] - 28s 9ms/step - loss: 0.0084 - val_loss: 0.0091
Epoch 5/10
3200/3200 [==============================] - 27s 9ms/step - loss: 0.0083 - val_loss: 0.0091
Epoch 6/10
3200/3200 [==============================] - 28s 9ms/step - loss: 0.0083 - val_loss: 0.0091
Epoch 7/10
3200/3200 [==============================] - 28s 9ms/step - loss: 0.0083 - val_loss: 0.0092
Epoch 8/10
3200/3200 [==============================] - 27s 9ms/step - loss: 0.0082 - val_loss: 0.0091
Epoch 9/10
3200/3200 [==============================] - 27s 9ms/step - loss: 0.0082 - val_loss: 0.0091
Epoch 10/10
3200/3200 [==============================] - 27s 9ms/step - loss: 0.0082 - val_loss: 0.0091
<keras.callbacks.History at 0x230f8a64700>
x_test_pred = custom_predict(model_2, x_test)
x_test_post = np.reshape(x_test_pred, (5000, 64, 64, 1))
157/157 [==============================] - 229s 1s/step
model_post.load_weights('tmp/checkpoint_post_2') # Let's load the best checkpoint and visualize the results
predica = model_post.predict(x_test_post)
fig, ax = plt.subplots(3, 3, figsize=(16, 16))
OFFSET = 50
for i in range(3):
    ax[i][0].imshow(x_test_post[i+OFFSET, :, :, :])
    ax[i][0].set_title('Original')
    ax[i][1].imshow(predica[i+OFFSET, :, :, :])
    ax[i][1].set_title('Prediction')
    ax[i][2].imshow(y_test[i+OFFSET, 0, :, :, :])
    ax[i][2].set_title('Target')
157/157 [==============================] - 1s 8ms/step
The changes are minimal, but they undoubtedly improve the results, mainly by erasing small artifacts around the digits, like the little dot under the seven in the second row or the small stain between the 6 and the 9 in the third row. Let's now compute the MSE on the same, full test set and wrap up this project.
MSE_test_3 = mse(np.reshape(y_test, (5000, 64, 64, 1)), predica).numpy()
print("Final result is an MSE of", MSE_test_3) # Final score for this model!
Final result is an MSE of 0.009298838
FINAL SCORE: MSE = 0.0092988¶
def final_predict(X): # Function defined to run the whole prediction pipeline in one call
    temp_pred = custom_predict(model_2, X)
    shape = temp_pred.shape
    temp_pred = np.reshape(temp_pred, (shape[0], shape[2], shape[3], shape[4])) # Drop the timesteps dimension
    return model_post.predict(temp_pred)
final_test = final_predict(x_test[0:4])
fig, ax = plt.subplots(4, 2, figsize=(10,16))
for i in range(4):
    ax[i][0].imshow(final_test[i, :, :, :])
    ax[i][0].set_title('Prediction')
    ax[i][1].imshow(y_test[i, 0, :, :, :])
    ax[i][1].set_title('Target')
1/1 [==============================] - 0s 28ms/step
1/1 [==============================] - 0s 16ms/step