Converted mnist notebook to keras (4f05c690) · Commits · 钟慕尧 / deepchem

examples/notebooks/mnist.ipynb

+29 −42

Original line number	Diff line number	Diff line
		%% Cell type:markdown id: tags:

		# MNIST with DeepChem and TensorGraph

		%% Cell type:code id: tags:

		``` python
		from tensorflow.examples.tutorials.mnist import input_data
		```

		%% Cell type:code id: tags:

		``` python
		mnist = input_data.read_data_sets("MNIST_data/", one_hot=True)
		```

		%% Output

		Extracting MNIST_data/train-images-idx3-ubyte.gz
		Extracting MNIST_data/train-labels-idx1-ubyte.gz
		Extracting MNIST_data/t10k-images-idx3-ubyte.gz
		Extracting MNIST_data/t10k-labels-idx1-ubyte.gz

		%% Cell type:code id: tags:

		``` python
		import deepchem as dc
		import tensorflow as tf
		from deepchem.models.tensorgraph.layers import Layer, Input, Reshape, Flatten, Conv2D, Label, Feature
		from deepchem.models.tensorgraph.layers import Dense, SoftMaxCrossEntropy, ReduceMean, SoftMax
		from tensorflow.keras.layers import Reshape, Conv2D, Flatten, Dense, Softmax
		```

		%% Cell type:code id: tags:

		``` python
		train = dc.data.NumpyDataset(mnist.train.images, mnist.train.labels)
		valid = dc.data.NumpyDataset(mnist.validation.images, mnist.validation.labels)
		```

		%% Cell type:code id: tags:

		``` python
		tg = dc.models.TensorGraph(tensorboard=True, model_dir='/tmp/mnist', use_queue=False)
		feature = Feature(shape=(None, 784))

		# Images are square 28x28 (batch, height, width, channel)
		make_image = Reshape(shape=(-1, 28, 28, 1), in_layers=[feature])

		conv2d_1 = Conv2D(num_outputs=32, in_layers=[make_image])

		conv2d_2 = Conv2D(num_outputs=64, in_layers=[conv2d_1])

		flatten = Flatten(in_layers=[conv2d_2])

		dense1 = Dense(out_channels=1024, activation_fn=tf.nn.relu, in_layers=[flatten])

		dense2 = Dense(out_channels=10, in_layers=[dense1])

		label = Label(shape=(None, 10))

		smce = SoftMaxCrossEntropy(in_layers=[label, dense2])
		loss = ReduceMean(in_layers=[smce])
		tg.set_loss(loss)

		output = SoftMax(in_layers=[dense2])
		tg.add_output(output)
		keras_model = tf.keras.Sequential([
		Reshape((28, 28, 1)),
		Conv2D(filters=32, kernel_size=5, activation=tf.nn.relu),
		Conv2D(filters=64, kernel_size=5, activation=tf.nn.relu),
		Flatten(),
		Dense(1024, activation=tf.nn.relu),
		Dense(10),
		Softmax()
		])
		model = dc.models.KerasModel(keras_model, dc.models.losses.CategoricalCrossEntropy())
		```

		%% Cell type:code id: tags:

		``` python
		# nb_epoch set to 0 to permit rendering of tutorials online.
		# Set nb_epoch=10 for better results
		tg.fit(train, nb_epoch=0)
		model.fit(train, nb_epoch=2)
		```

		%% Output

		TIMING: model fitting took 2.621 s
		0.0

		%% Cell type:code id: tags:

		``` python
		# Note that AUCs will be nonsensical without setting nb_epoch higher!
		from sklearn.metrics import roc_curve, auc
		import numpy as np

		print("Validation")
		prediction = np.squeeze(tg.predict_on_batch(valid.X))
		prediction = np.squeeze(model.predict_on_batch(valid.X))

		fpr = dict()
		tpr = dict()
		roc_auc = dict()
		for i in range(10):
		fpr[i], tpr[i], thresh = roc_curve(valid.y[:, i], prediction[:, i])
		roc_auc[i] = auc(fpr[i], tpr[i])
		print("class %s:auc=%s" % (i, roc_auc[i]))
		```

		%% Output

		Validation
		class 0:auc=0.170555039138
		class 1:auc=0.634619025945
		class 2:auc=0.303693111629
		class 3:auc=0.549712392397
		class 4:auc=0.523565007169
		class 5:auc=0.648496399959
		class 6:auc=0.316489936331
		class 7:auc=0.708521348315
		class 8:auc=0.555897147512
		class 9:auc=0.377021042837
		class 0:auc=0.9999515136738367
		class 1:auc=0.999956365633573
		class 2:auc=0.9998060726950355
		class 3:auc=0.9999626454408761
		class 4:auc=0.9999271593180605
		class 5:auc=0.9999116894861034
		class 6:auc=0.9999347825797615
		class 7:auc=0.9998377936670072
		class 8:auc=0.9999093751848269
		class 9:auc=0.9996134485812621

		%% Cell type:code id: tags:

		``` python
		```

Admin message