Installing keras requires
Python (2 for CPU, 3 for GPU).
A virtual environment (virtualenv, anaconda)
Tensorflow is the default option
# Install the Keras backend, letting install_keras() choose its default
# TensorFlow version.
install_keras(tensorflow = "default")
The MNIST database is a large database of handwritten digits that is commonly used for training various image processing systems.
Handwritten digits are stored as square matrices of 28 by 28 pixels (784 pixels in total). Each pixel takes one of 256 grey levels (0 to 255).
# Load MNIST through keras and unpack images (x) and labels (y)
# for the training and test splits.
mnist <- dataset_mnist()
y_train <- mnist[["train"]][["y"]]
x_train <- mnist[["train"]][["x"]]
y_test <- mnist[["test"]][["y"]]
x_test <- mnist[["test"]][["x"]]
# Restrict both splits to the digits 2 and 7.
# The logical masks are computed first, from the full label vectors,
# and then applied to the images and labels of each split.
boo_train <- (y_train == 7) | (y_train == 2)
boo_test <- (y_test == 7) | (y_test == 2)

# training data
y_train <- mnist$train$y[boo_train]
x_train <- mnist$train$x[boo_train, , ]

# test data
y_test <- mnist$test$y[boo_test]
x_test <- mnist$test$x[boo_test, , ]
# Display the first retained test digit; rows are reversed and the matrix
# transposed before it is handed to image().
x_test[1, 28:1, ] %>%
  t() %>%
  image(col = grey.colors(5))
# Flattening: turn each 28 x 28 image into one row of 784 pixel values,
# matching the `input_shape = 784` expected by the first dense layer.
# (The original calls were cut off after the first argument.)
x_train <- array_reshape(x_train, c(nrow(x_train), 784))
x_test <- array_reshape(x_test, c(nrow(x_test), 784))
# Training split: divide pixel values by 255 and recode the label
# as 1 for the digit 7 and 0 otherwise.
x_train <- x_train / 255
y_train <- as.numeric(y_train == 7)

# Test split: same treatment.
x_test <- x_test / 255
y_test <- as.numeric(y_test == 7)
# Binary classifier: one hidden ReLU layer of 128 units on the 784 inputs,
# dropout at rate 0.5, then a single sigmoid output unit.
model <- keras_model_sequential()
model %>%
  layer_dense(units = 128, activation = "relu", input_shape = 784) %>%
  layer_dropout(rate = 0.5) %>%
  layer_dense(units = 1, activation = "sigmoid")
# Configure training: binary cross-entropy loss, SGD optimizer, and accuracy
# reported as a metric. The closing parenthesis of compile() was missing.
# NOTE(review): recent keras releases appear to rename `lr` to
# `learning_rate`; kept as written here -- confirm against the installed
# version.
model %>% compile(
  loss = "binary_crossentropy",
  optimizer = optimizer_sgd(lr = 0.01, decay = 0.001),
  metrics = c("accuracy")
)
# Train on the 2-vs-7 training data and keep the per-epoch history.
# The fit() call itself was missing (only its argument list survived), so it
# is restored here with the training inputs and labels prepared above.
# The test split is passed as validation data; verbose = 0 silences progress
# output.
history <- model %>%
  fit(
    x_train, y_train,
    epochs = 20,
    batch_size = 100,
    validation_data = list(x_test, y_test),
    verbose = 0
  )
# Loss and accuracy of the fitted model on the 2-vs-7 test images
# (recorded output below).
evaluate(model, x_test, y_test)
## $loss
## [1] 0.08389094
## $acc
## [1] 0.9742718
# Predicted class for every test image. The prediction call was missing, so
# `model` was being piped directly into table(). predict() returns the
# sigmoid output as a one-column matrix; thresholding at 0.5 and multiplying
# by 1L gives a 0/1 integer matrix with the same shape, which is what the
# later `pred_class[, 1]` indexing expects.
pred_class <- (predict(model, x_test) > 0.5) * 1L

# Confusion table against the original digit labels (2 or 7).
table(predicted = pred_class,
      observed = mnist$test$y[boo_test])
## observed
## predicted 2 7
## 0 1015 36
## 1 17 992
# Positions (within the filtered 2/7 test set) of true 7s that the model
# assigned to class 0, i.e. predicted as 2.
# NOTE(review): with 7 coded as the positive class these would usually be
# called false negatives; the name is kept because later code uses it.
false_positive <- which(pred_class[, 1] == 0 & mnist$test$y[boo_test] == 7)

# Rebuild the first such flattened image as a 28 x 28 matrix and plot it.
image(
  matrix(x_test[false_positive[1], ], nrow = 28)[, 28:1],
  col = grey.colors(5)
)
# ResNet50 with ImageNet weights, used below on an MNIST digit.
pretrained_model <- application_resnet50(weights = "imagenet")
Let’s consider our misclassified example.
# Fetch the raw 28 x 28 image of the third misclassified 7.
# `false_positive` holds positions within the filtered 2/7 test subset, so it
# must be mapped back through which(boo_test) before indexing the full,
# unfiltered test array. Indexing mnist$test$x with it directly picked an
# unrelated image.
img <- mnist$test$x[which(boo_test)[false_positive[3]], , ]

# Build a batch of one 3-channel image: the single grey-level matrix is
# recycled into each of the three channels.
x <- array(NA, c(1, 28, 28, 3))
x[1, , , 1:3] <- img

# Resize to 224 x 224 and apply the ImageNet preprocessing before prediction.
x <- image_array_resize(x, 224, 224)
x <- imagenet_preprocess_input(x)
And see its prediction in ImageNet (yes, the result is nonsense).
# Run the pretrained network on the prepared image and show its four
# top-ranked ImageNet labels.
pred <- predict(pretrained_model, x)
imagenet_decode_predictions(pred, top = 4)[[1]]