In this notebook we build a simple autoencoder for MNIST data, and show how to use it for anomaly detection.
import tensorflow as tf
from tensorflow.keras import layers
from tensorflow.keras.models import Model
from tensorflow.keras.optimizers import Adam
Both the encoder and the decoder are just composed of a couple of dense layers. The latent dimension is 16: each input is reduced from an initial dimension of 28*28=784 to an internal representation of just 16 floats.
Most of the relevant information is preserved, as witnessed by the fact that, out of these 16 values, we are able to reconstruct an image very similar to the original one.
# size of our encoded representations
encoding_dim = 16
mid_dim = 64
# input placeholder
input_img = layers.Input(shape=(784,))
# "encoded" is the encoded representation of the input
encoded = layers.Dense(mid_dim, activation='relu')(input_img)
encoded = layers.Dense(encoding_dim, activation='relu')(encoded)
# "decoded" is the lossy reconstruction of the input
decoded = layers.Dense(mid_dim, activation='relu')(encoded)
decoded = layers.Dense(784, activation='sigmoid')(decoded)
# this model maps an input to its reconstruction
autoencoder = Model(input_img, decoded)
autoencoder.summary()
Model: "model_1" _________________________________________________________________ Layer (type) Output Shape Param # ================================================================= input_2 (InputLayer) [(None, 784)] 0 _________________________________________________________________ dense_4 (Dense) (None, 64) 50240 _________________________________________________________________ dense_5 (Dense) (None, 16) 1040 _________________________________________________________________ dense_6 (Dense) (None, 64) 1088 _________________________________________________________________ dense_7 (Dense) (None, 784) 50960 ================================================================= Total params: 103,328 Trainable params: 103,328 Non-trainable params: 0 _________________________________________________________________
We can now compile the model.
As loss function we can use either mse or binary crossentropy, as you prefer (binary crossentropy is appropriate here since pixels are normalized to [0,1] and the output activation is sigmoid).
adam = Adam(learning_rate=0.001)
autoencoder.compile(optimizer=adam, loss='mse')
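For reference, this is how the compilation step would look with binary crossentropy instead (a minimal alternative sketch, not used in the rest of the notebook):
# alternative compilation: treat each pixel as a Bernoulli variable
autoencoder.compile(optimizer=Adam(learning_rate=0.001), loss='binary_crossentropy')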
We now load the dataset, and normalize it in the range [0,1]. We are not using the labels.
from tensorflow.keras.datasets import mnist
import numpy as np
(x_train, _), (x_test, _) = mnist.load_data()
x_train = x_train.astype('float32') / 255.
x_test = x_test.astype('float32') / 255.
x_train = x_train.reshape((len(x_train), np.prod(x_train.shape[1:])))
x_test = x_test.reshape((len(x_test), np.prod(x_test.shape[1:])))
print(x_train.shape)
print(x_test.shape)
(60000, 784)
(10000, 784)
Time to fit the model. Observe that the ground truth we need to compare with is, in this case, the input itself. In other words, the loss is the distance between the input $X$ and its reconstruction $\hat{X}$.
autoencoder.fit(x_train, x_train,
epochs=20,
batch_size=256,
shuffle=True,
validation_data=(x_test, x_test))
Epoch 1/20
235/235 [==============================] - 1s 4ms/step - loss: 0.0165 - val_loss: 0.0160
Epoch 2/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0163 - val_loss: 0.0159
Epoch 3/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0162 - val_loss: 0.0158
Epoch 4/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0161 - val_loss: 0.0157
Epoch 5/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0160 - val_loss: 0.0157
Epoch 6/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0159 - val_loss: 0.0156
Epoch 7/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0159 - val_loss: 0.0156
Epoch 8/20
235/235 [==============================] - 1s 4ms/step - loss: 0.0158 - val_loss: 0.0154
Epoch 9/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0158 - val_loss: 0.0154
Epoch 10/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0157 - val_loss: 0.0153
Epoch 11/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0156 - val_loss: 0.0153
Epoch 12/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0157 - val_loss: 0.0152
Epoch 13/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0155 - val_loss: 0.0152
Epoch 14/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0154 - val_loss: 0.0153
Epoch 15/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0154 - val_loss: 0.0151
Epoch 16/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0154 - val_loss: 0.0150
Epoch 17/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0153 - val_loss: 0.0150
Epoch 18/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0152 - val_loss: 0.0150
Epoch 19/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0152 - val_loss: 0.0149
Epoch 20/20
235/235 [==============================] - 1s 3ms/step - loss: 0.0152 - val_loss: 0.0149
<tensorflow.python.keras.callbacks.History at 0x7f76c265a1d0>
Let us check the result.
First of all we compute the reconstructions of all images in the test set.
decoded_imgs = autoencoder.predict(x_test)
Now we can plot the result. We pick ten random images, and for each of them we show the original and the reconstruction obtained from the autoencoder.
import matplotlib.pyplot as plt
n = 10  # number of images to plot
imgs = np.random.randint(low=0,high=10000,size=n)
plt.figure(figsize=(20, 4))
for (i,idx) in enumerate(imgs):
# display original
ax = plt.subplot(2, n, i + 1)
plt.imshow(x_test[idx].reshape(28, 28))
plt.gray()
ax.get_xaxis().set_visible(False)
ax.get_yaxis().set_visible(False)
# display reconstruction
ax = plt.subplot(2, n, i + 1 + n)
plt.imshow(decoded_imgs[idx].reshape(28, 28))
plt.gray()
ax.get_xaxis().set_visible(False)
ax.get_yaxis().set_visible(False)
plt.show()
Anomaly detection
We now want to show how an autoencoder can be used for anomaly detection.
The general idea is that the encoding learned by the autoencoder is data-specific. This means that if we apply the autoencoder to an outlier, the resulting reconstruction should be noticeably worse than usual, and we can exploit this simple fact to detect the anomaly.
The first step of the procedure is to estimate the expected reconstruction error on normal data, together with its standard deviation.
mse_all = np.mean(np.square(decoded_imgs - x_test),axis=1) #mean error for each input
print(mse_all.shape)
mse = np.mean(mse_all)
std = np.std(mse_all)
print("mse is {}, with a standard deviation of {}".format(mse,std))
(10000,)
mse is 0.01905367523431778, with a standard deviation of 0.009669928811490536
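As a side note, once the mean error and its standard deviation are known, the detection criterion can be wrapped in a small helper. The sketch below is our own illustration (the name is_anomaly and the three-standard-deviation threshold are arbitrary choices, not part of the original experiment):
def is_anomaly(model, x, mean_err=mse, std_err=std, k=3.0):
    # x has shape (n_samples, 784); flag inputs whose reconstruction error
    # exceeds mean_err + k * std_err
    rec = model.predict(x)
    err = np.mean(np.square(rec - x), axis=1)
    return err > mean_err + k * std_err

# sanity check: very few normal test images should be flagged
flags = is_anomaly(autoencoder, x_test[:100])
print("{} anomalies out of {}".format(flags.sum(), len(flags)))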
Now we create an "anomaly". We simply take a normal image from the dataset, and rotate it of 90 degrees.
For this example, we use image no 15 in the test set.
test = x_test[15].reshape(1,784)
print(autoencoder.evaluate(test,test))
plt.figure(figsize=(8,4))
ax = plt.subplot(1,2,1)
plt.imshow(x_test[15].reshape(28, 28))
plt.gray()
ax.get_xaxis().set_visible(False)
ax.get_yaxis().set_visible(False)
ax = plt.subplot(1, 2, 2)
plt.imshow(decoded_imgs[15].reshape(28, 28))
plt.gray()
ax.get_xaxis().set_visible(False)
ax.get_yaxis().set_visible(False)
plt.savefig('lyar1.jpg')
plt.show()
1/1 [==============================] - 0s 16ms/step - loss: 0.0270
0.027014590799808502
Observe that the reconstruction is not particularly good, but the loss (0.027) is still less than one standard deviation away from the mean, which is normal behaviour.
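For reference, a quick way to express this error in units of standard deviations, using the mse and std values computed above (a small sketch of our own):
loss_15 = autoencoder.evaluate(test, test, verbose=0)
print("z-score: {:.2f}".format((loss_15 - mse) / std))  # about 0.8 with the values above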
Now, let us rotate it and repeat the computation.
rotated = np.rot90(x_test[15].reshape(28,28))
predicted = autoencoder.predict(rotated.reshape(1,784))[0].reshape(28,28)
plt.figure(figsize=(8,4))
ax = plt.subplot(1,2,1)
plt.imshow(rotated)
plt.gray()
ax.get_xaxis().set_visible(False)
ax.get_yaxis().set_visible(False)
ax = plt.subplot(1, 2, 2)
plt.imshow(predicted)
plt.gray()
ax.get_xaxis().set_visible(False)
ax.get_yaxis().set_visible(False)
plt.savefig('lyar2.jpg')
plt.show()
mse = np.mean(np.square(predicted-rotated))
print("mse is {}".format(mse))
mse is 0.052468638867139816
The mse in this case is 0.052, more than 3 standard deviations away from the mean: this is clearly an anomaly!
Let us finally observe that, instead of using the mean and variance of the reconstruction errors, we could have worked directly in the latent space.
In fact, autoencoders generalize Principal Component Analysis, extracting relevant, non-linear combinations of the input features. Any anomaly will deviate noticeably from the canonical values of the latent encoding.
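As a sketch of that alternative (the encoder sub-model and the per-dimension z-score below are our own illustration, not part of the original notebook), we can reuse the trained layers up to the bottleneck to map inputs into the 16-dimensional latent space, and measure how far a code lies from the statistics of normal data:
# encoder sub-model: reuses the trained layers up to the 16-dimensional bottleneck
encoder = Model(input_img, encoded)

# latent statistics computed on normal data
codes = encoder.predict(x_test)
mu = codes.mean(axis=0)
sigma = codes.std(axis=0) + 1e-8  # avoid division by zero for inactive units

def latent_score(x):
    # mean absolute z-score of the latent code of x, with x of shape (n, 784)
    z = (encoder.predict(x) - mu) / sigma
    return np.mean(np.abs(z), axis=1)

print("normal image: ", latent_score(x_test[15].reshape(1, 784)))
print("rotated image:", latent_score(rotated.reshape(1, 784)))
We would expect the rotated image to receive a noticeably higher score than the normal one, mirroring what we observed with the reconstruction error.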