#
# Copyright 2016 The BigDL Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# MNIST CNN Example on BigDL
# References:
#   https://github.com/fchollet/keras/blob/1.2.2/examples/mnist_cnn.py
#   ../../models/lenet/lenet5.py
# The Keras version we support and test is Keras 1.2.2 with TensorFlow backend.
# See README.md for how to run this example.
from optparse import OptionParser
from bigdl.examples.keras.keras_utils import *
import keras.backend
# Shape of one single-channel 28x28 image, laid out to match the Keras
# backend's dimension ordering: channel axis first for "th", last otherwise.
input_shape = (1, 28, 28) if keras.backend.image_dim_ordering() == "th" else (28, 28, 1)
def get_mnist(sc, data_type="train", location="/tmp/mnist"):
    """
    Download or load the MNIST dataset to/from `location` and return the
    requested split (`data_type`) as an RDD of Sample.

    Images are reshaped to the module-level `input_shape` and normalized with
    `mnist.TRAIN_MEAN` / `mnist.TRAIN_STD`; labels are shifted up by one.
    """
    from bigdl.dataset import mnist
    from bigdl.dataset.transformer import normalizer

    def normalize_pair(pair):
        # Normalize the image and pass the label through untouched.
        image, label = pair
        return normalizer(image, mnist.TRAIN_MEAN, mnist.TRAIN_STD), label

    def to_sample(pair):
        features, label = pair
        return Sample.from_ndarray(features, label)

    raw_images, raw_labels = mnist.read_data_sets(location, data_type)
    shaped_images = raw_images.reshape((raw_images.shape[0], ) + input_shape)
    image_rdd = sc.parallelize(shaped_images)
    # Targets start from 1 in BigDL, hence the +1 on every label.
    label_rdd = sc.parallelize(raw_labels + 1)
    return image_rdd.zip(label_rdd).map(normalize_pair).map(to_sample)
def build_keras_model():
    """
    Build and return the convnet as a Keras 1.2.2 Sequential model.

    The stack is two 3x3 convolutions (32 filters each) with ReLU, a 2x2
    max-pooling, dropout, then a 128-unit dense layer with ReLU, dropout,
    and a 10-way softmax output. The first layer takes the module-level
    `input_shape`.
    """
    from keras.models import Sequential
    from keras.layers import Dense, Dropout, Activation, Flatten
    from keras.layers import Convolution2D, MaxPooling2D

    # Layers are listed in the exact order they are stacked.
    layer_stack = [
        Convolution2D(32, 3, 3, border_mode='valid', input_shape=input_shape),
        Activation('relu'),
        Convolution2D(32, 3, 3),
        Activation('relu'),
        MaxPooling2D(pool_size=(2, 2)),
        Dropout(0.25),
        Flatten(),
        Dense(128),
        Activation('relu'),
        Dropout(0.5),
        Dense(10),
        Activation('softmax'),
    ]

    model = Sequential()
    for layer in layer_stack:
        model.add(layer)
    return model
if __name__ == "__main__":
    # Command-line options: batch size, number of training epochs, and the
    # directory MNIST is read from.
    parser = OptionParser()
    parser.add_option("-b", "--batchSize", type=int, dest="batchSize", default=128)
    parser.add_option("-m", "--max_epoch", type=int, dest="max_epoch", default=12)
    parser.add_option("-d", "--dataPath", dest="dataPath", default="/tmp/mnist")
    # parse_args() reads sys.argv[1:] on its own, so this script does not need
    # a `sys` name in scope and the program name is not treated as a
    # positional argument.
    (options, args) = parser.parse_args()

    # Define the model in Keras and dump its definition to a JSON file.
    keras_model = build_keras_model()
    json_path = "/tmp/lenet.json"
    save_keras_definition(keras_model, json_path)

    from bigdl.util.common import *
    from bigdl.nn.layer import *
    from bigdl.optim.optimizer import *
    from bigdl.nn.criterion import *

    # Load the JSON file to a BigDL model
    bigdl_model = Model.load_keras(json_path=json_path)

    # Set up Spark and the BigDL engine before touching any RDD.
    sc = get_spark_context(conf=create_spark_conf())
    redire_spark_logs()
    show_bigdl_info_logs()
    init_engine()

    train_data = get_mnist(sc, "train", options.dataPath)
    test_data = get_mnist(sc, "test", options.dataPath)

    # The model ends in a softmax layer, so the criterion is told that its
    # input is not log-probabilities (logProbAsInput=False).
    optimizer = Optimizer(
        model=bigdl_model,
        training_rdd=train_data,
        criterion=ClassNLLCriterion(logProbAsInput=False),
        optim_method=Adadelta(),
        end_trigger=MaxEpoch(options.max_epoch),
        batch_size=options.batchSize)
    # Report top-1 accuracy on the test split after every epoch.
    optimizer.set_validation(
        batch_size=options.batchSize,
        val_rdd=test_data,
        trigger=EveryEpoch(),
        val_method=[Top1Accuracy()]
    )
    optimizer.optimize()