Merge pull request #925 from rbharath/sequential (ae754761) · Commits · 钟慕尧 / deepchem

deepchem/models/init.py

+1 −1

Original line number	Diff line number	Diff line
		@@ -13,7 +13,6 @@ from deepchem.models.tf_new_models.multitask_regressor import MultitaskGraphRegr

		from deepchem.models.tf_new_models.support_classifier import SupportGraphClassifier
		from deepchem.models.multitask import SingletaskToMultitask
		from deepchem.models.sequential import Sequential

		from deepchem.models.tensorflow_models.fcnet import TensorflowMultiTaskRegressor
		from deepchem.models.tensorflow_models.fcnet import TensorflowMultiTaskClassifier
		@@ -34,3 +33,4 @@ from deepchem.models.tensorgraph.models.symmetry_function_regression import BPSy
		from deepchem.models.tensorgraph.models.seqtoseq import SeqToSeq
		from deepchem.models.tensorgraph.models.gan import GAN, WGAN
		from deepchem.models.tensorgraph.models.text_cnn import TextCNNTensorGraph
		from deepchem.models.tensorgraph.sequential import Sequential

deepchem/models/sequential.py

deleted100644 → 0

+0 −341

Original line number	Diff line number	Diff line
		"""
		Contains Sequential model adapted from keras/keras/models.py.

		This class is adapted from Keras directly. Have cut out functionality
		and changed API to match DeepChem style.
		"""
		from __future__ import print_function
		from __future__ import division
		from __future__ import unicode_literals

		__author__ = "Bharath Ramsundar"
		__copyright__ = "Copyright 2017, Stanford University"
		__license__ = "MIT"

		import time
		import os
		import tempfile
		import numpy as np
		import tensorflow as tf
		from deepchem.models.models import Model
		from deepchem.nn import model_ops
		from deepchem.nn.copy import Layer
		from deepchem.nn.copy import InputLayer


		class Sequential(Model):
		"""Linear stack of layers.

		Parameters
		----------
		layers: list of layers to add to the model.

		Note
		----
		The first layer passed to a Sequential model
		should have a defined input shape. What that
		means is that it should have received an `input_shape`
		or `batch_input_shape` argument,
		or for some type of layers (recurrent, Dense...)
		an `input_dim` argument.

		Example
		-------
		>>> import deepchem as dc
		>>> model = dc.models.Sequential()
		>>> # Add features
		>>> model.add_features(dc.nn.Input(shape=(50,)))
		>>> # Add labels
		>>> model.add_labels(dc.nn.Input(shape=(1,)))
		>>> model.add(dc.nn.Dense(32, 50))
		>>> model.add(dc.nn.Dense(64, 32))
		"""

		def __init__(self, name=None, logdir=None):
		super(Sequential, self).__init__(self, model_dir=logdir)
		self.layers = [] # stack of layers
		self.outputs = None # tensors (length 1)

		if not name:
		prefix = 'sequential_'
		name = prefix + str(model_ops.get_uid(prefix))
		self.name = name
		self.graph = tf.Graph()

		config = tf.ConfigProto(allow_soft_placement=True)
		self.session = tf.Session(graph=self.graph, config=config)
		# Path to save checkpoint files
		self._save_path = os.path.join(self.model_dir, 'model.ckpt')

		def add(self, layer):
		"""Adds a layer instance on top of the layer stack.

		Parameters
		----------
		layer: layer instance.
		"""
		if not isinstance(layer, Layer):
		raise TypeError("The added layer must be an instance of class Layer. "
		"Found: " + str(layer))
		with self.graph.as_default():
		if not self.layers:
		raise ValueError("Call add_features() before calling add()")
		# first layer in model: check that it is an input layer

		else:
		self.outputs = layer(self.outputs)

		self.layers.append(layer)

		def add_features(self, layer):
		"""Adds an input layer."""
		if self.layers:
		raise ValueError(
		"add_features() has to be called before layers are added.")
		if not isinstance(layer, InputLayer):
		raise ValueError("First layer in sequential model must be InputLayer")
		with self.graph.as_default():
		self.features = layer()[0]
		self.outputs = self.features
		self.layers = [layer]

		def add_labels(self, layer):
		"""Adds a layer for labels"""
		with self.graph.as_default():
		self.labels = layer()[0]

		def add_loss(self, loss, inputs=None):
		"""Adds a loss to model.

		Parameters
		----------
		losses: list
		"""
		# Add losses to graph
		with self.graph.as_default():
		# Loss for each batch element
		batch_loss = loss(self.outputs, self.labels)
		# Loss should be a float
		self.loss = tf.reduce_sum(batch_loss)

		@property
		def uses_learning_phase(self):
		return self.uses_learning_phase

		def fit(self,
		dataset,
		nb_epoch=10,
		max_checkpoints_to_keep=5,
		log_every_N_batches=50,
		learning_rate=.001,
		batch_size=50,
		checkpoint_interval=10):
		"""Trains the model for a fixed number of epochs.

		TODO(rbharath0: This is mostly copied from TensorflowGraphModel. Should
		eventually refactor both together.

		Parameters
		----------
		dataset: dc.data.Dataset
		nb_epoch: 10
		Number of training epochs.
		Dataset object holding training data
		batch_size: integer. Number of samples per gradient update.
		nb_epoch: integer, the number of epochs to train the model.
		verbose: 0 for no logging to stdout,
		1 for progress bar logging, 2 for one log line per epoch.
		initial_epoch: epoch at which to start training
		(useful for resuming a previous training run)
		checkpoint_interval: int
		Frequency at which to write checkpoints, measured in epochs
		"""
		############################################################## TIMING
		time1 = time.time()
		############################################################## TIMING
		print("Training for %d epochs" % nb_epoch)
		with self.graph.as_default():
		opt = model_ops.optimizer("adam", learning_rate)
		train_op = opt.minimize(self.loss, name='train')
		with self.session as sess:
		sess.run(tf.global_variables_initializer())
		saver = tf.train.Saver(max_to_keep=max_checkpoints_to_keep)
		# Save an initial checkpoint.
		saver.save(sess, self._save_path, global_step=0)
		for epoch in range(nb_epoch):
		avg_loss, n_batches = 0., 0
		# TODO(rbharath): Don't support example weighting yet.
		for ind, (X_b, y_b, w_b,
		ids_b) in enumerate(dataset.iterbatches(batch_size)):
		if ind % log_every_N_batches == 0:
		print("On batch %d" % ind)
		feed_dict = {self.features: X_b, self.labels: y_b}
		fetches = [self.outputs] + [train_op, self.loss]
		fetched_values = sess.run(fetches, feed_dict=feed_dict)
		output = fetched_values[:1]
		loss = fetched_values[-1]
		avg_loss += loss
		y_pred = np.squeeze(np.array(output))
		y_b = y_b.flatten()
		n_batches += 1
		if epoch % checkpoint_interval == checkpoint_interval - 1:
		saver.save(sess, self._save_path, global_step=epoch)
		avg_loss = float(avg_loss) / n_batches
		print('Ending epoch %d: Average loss %g' % (epoch, avg_loss))
		# Always save a final checkpoint when complete.
		saver.save(sess, self._save_path, global_step=epoch + 1)
		############################################################## TIMING
		time2 = time.time()
		print("TIMING: model fitting took %0.3f s" % (time2 - time1))
		############################################################## TIMING

		def evaluate(self,
		x,
		y,
		batch_size=32,
		verbose=1,
		sample_weight=None,
		**kwargs):
		"""Computes the loss on some input data, batch by batch.

		Parameters
		----------
		x: input data, as a Numpy array or list of Numpy arrays
		(if the model has multiple inputs).
		y: labels, as a Numpy array.
		batch_size: integer. Number of samples per gradient update.
		verbose: verbosity mode, 0 or 1.
		sample_weight: sample weights, as a Numpy array.

		Returns
		-------
		Scalar test loss (if the model has no metrics)
		or list of scalars (if the model computes other metrics).
		The attribute `model.metrics_names` will give you
		the display labels for the scalar outputs.
		"""
		if self.model is None:
		raise RuntimeError('The model needs to be compiled ' 'before being used.')
		if 'show_accuracy' in kwargs:
		kwargs.pop('show_accuracy')
		warnings.warn('The "show_accuracy" argument is deprecated, '
		'instead you should pass the "accuracy" metric to '
		'the model at compile time:\n'
		'`model.compile(optimizer, loss, '
		'metrics=["accuracy"])`')
		if kwargs:
		raise TypeError('Received unknown keyword arguments: ' + str(kwargs))
		return self.model.evaluate(
		x,
		y,
		batch_size=batch_size,
		verbose=verbose,
		sample_weight=sample_weight)

		def predict(self, x, batch_size=32, verbose=0):
		"""Generates output predictions for the input samples,
		processing the samples in a batched way.

		# Arguments
		x: the input data, as a Numpy array.
		batch_size: integer.
		verbose: verbosity mode, 0 or 1.

		# Returns
		A Numpy array of predictions.
		"""
		if self.model is None:
		self.build()
		return self.model.predict(x, batch_size=batch_size, verbose=verbose)

		def predict_on_batch(self, x):
		"""Returns predictions for a single batch of samples.
		"""
		if self.model is None:
		self.build()
		return self.model.predict_on_batch(x)

		def train_on_batch(self,
		x,
		y,
		class_weight=None,
		sample_weight=None,
		**kwargs):
		"""Single gradient update over one batch of samples.

		# Arguments
		x: input data, as a Numpy array or list of Numpy arrays
		(if the model has multiple inputs).
		y: labels, as a Numpy array.
		class_weight: dictionary mapping classes to a weight value,
		used for scaling the loss function (during training only).
		sample_weight: sample weights, as a Numpy array.

		# Returns
		Scalar training loss (if the model has no metrics)
		or list of scalars (if the model computes other metrics).
		The attribute `model.metrics_names` will give you
		the display labels for the scalar outputs.
		"""
		if self.model is None:
		raise RuntimeError('The model needs to be compiled ' 'before being used.')
		if 'accuracy' in kwargs:
		kwargs.pop('accuracy')
		warnings.warn('The "accuracy" argument is deprecated, '
		'instead you should pass the "accuracy" metric to '
		'the model at compile time:\n'
		'`model.compile(optimizer, loss, '
		'metrics=["accuracy"])`')
		if kwargs:
		raise TypeError('Received unknown keyword arguments: ' + str(kwargs))
		return self.model.train_on_batch(
		x, y, sample_weight=sample_weight, class_weight=class_weight)

		def test_on_batch(self, x, y, sample_weight=None, **kwargs):
		"""Evaluates the model over a single batch of samples.

		# Arguments
		x: input data, as a Numpy array or list of Numpy arrays
		(if the model has multiple inputs).
		y: labels, as a Numpy array.
		sample_weight: sample weights, as a Numpy array.

		# Returns
		Scalar test loss (if the model has no metrics)
		or list of scalars (if the model computes other metrics).
		The attribute `model.metrics_names` will give you
		the display labels for the scalar outputs.
		"""
		if self.model is None:
		raise RuntimeError('The model needs to be compiled ' 'before being used.')
		if 'accuracy' in kwargs:
		kwargs.pop('accuracy')
		warnings.warn('The "accuracy" argument is deprecated, '
		'instead you should pass the "accuracy" metric to '
		'the model at compile time:\n'
		'`model.compile(optimizer, loss, '
		'metrics=["accuracy"])`')
		if kwargs:
		raise TypeError('Received unknown keyword arguments: ' + str(kwargs))
		return self.model.test_on_batch(x, y, sample_weight=sample_weight)

		def predict_proba(self, x, batch_size=32, verbose=1):
		"""Generates class probability predictions for the input samples
		batch by batch.

		# Arguments
		x: input data, as a Numpy array or list of Numpy arrays
		(if the model has multiple inputs).
		batch_size: integer.
		verbose: verbosity mode, 0 or 1.

		# Returns
		A Numpy array of probability predictions.
		"""
		preds = self.predict(x, batch_size, verbose)
		if preds.min() < 0. or preds.max() > 1.:
		warnings.warn('Network returning invalid probability values. '
		'The last layer might not normalize predictions '
		'into probabilities '
		'(like softmax or sigmoid would).')
		return preds

deepchem/models/tensorgraph/layers.py

+1 −1

Original line number	Diff line number	Diff line
		@@ -1084,7 +1084,7 @@ class SoftMax(Layer):
		def create_tensor(self, in_layers=None, set_tensors=True, **kwargs):
		inputs = self._get_input_tensors(in_layers)
		if len(inputs) != 1:
		raise ValueError("Must only Softmax single parent")
		raise ValueError("Softmax must have a single input layer.")
		parent = inputs[0]
		out_tensor = tf.contrib.layers.softmax(parent)
		if set_tensors:

deepchem/models/tensorgraph/sequential.py

0 → 100644

+119 −0

Original line number	Diff line number	Diff line
		"""
		Convenience class for building sequential deep networks.
		"""
		from __future__ import print_function
		from __future__ import division
		from __future__ import unicode_literals

		import warnings
		import tensorflow as tf
		from deepchem.models.tensorgraph.tensor_graph import TensorGraph
		from deepchem.models.tensorgraph.layers import Feature
		from deepchem.models.tensorgraph.layers import Label
		from deepchem.models.tensorgraph.layers import SoftMaxCrossEntropy
		from deepchem.models.tensorgraph.layers import ReduceMean
		from deepchem.models.tensorgraph.layers import ReduceSquareDifference


		class Sequential(TensorGraph):
		"""Sequential models are linear stacks of layers.

		Analogous to the Sequential model from Keras and allows for less
		verbose construction of simple deep learning model.

		Example
		-------

		>>> import deepchem as dc
		>>> import numpy as np
		>>> from deepchem.models.tensorgraph import layers
		>>> # Define Data
		>>> X = np.random.rand(20, 2)
		>>> y = [[0, 1] for x in range(20)]
		>>> dataset = dc.data.NumpyDataset(X, y)
		>>> model = dc.models.Sequential(learning_rate=0.01)
		>>> model.add(layers.Dense(out_channels=2))
		>>> model.add(layers.SoftMax())
		"""

		def __init__(self, **kwargs):
		"""Initializes a sequential model
		"""
		self.num_layers = 0
		self._prev_layer = None
		if "use_queue" in kwargs:
		if kwargs["use_queue"]:
		raise ValueError("Sequential doesn't support queues.")
		kwargs["use_queue"] = False
		self._layer_list = []
		self._built = False
		super(Sequential, self).__init__(**kwargs)

		def add(self, layer):
		"""Adds a new layer to model.

		Parameter
		---------
		layer: Layer
		Adds layer to this graph.
		"""
		self._layer_list.append(layer)

		def fit(self, dataset, loss, **kwargs):
		"""Fits on the specified dataset.

		If called for the first time, constructs the TensorFlow graph for this
		model. Fits this graph on the specified dataset according to the specified
		loss.

		Parameters
		----------
		dataset: dc.data.Dataset
		Dataset with data
		loss: string
		Only "binary_crossentropy" or "mse" for now.
		"""
		X_shape, y_shape, _, _ = dataset.get_shape()
		# Calling fit() for first time
		if not self.built:
		feature_shape = X_shape[1:]
		label_shape = y_shape[1:]
		# Add in features
		features = Feature(shape=(None,) + feature_shape)
		# Add in labels
		labels = Label(shape=(None,) + label_shape)

		# Add in all layers
		prev_layer = features
		if len(self._layer_list) == 0:
		raise ValueError("No layers have been added to model.")
		for ind, layer in enumerate(self._layer_list):
		if len(layer.in_layers) > 1:
		raise ValueError("Cannot specify more than one "
		"in_layer for Sequential.")
		layer.in_layers += [prev_layer]
		prev_layer = layer
		# The last layer is the output of the model
		self.outputs.append(prev_layer)

		if loss == "binary_crossentropy":
		smce = SoftMaxCrossEntropy(in_layers=[labels, prev_layer])
		self.set_loss(ReduceMean(in_layers=[smce]))
		elif loss == "mse":
		mse = ReduceSquareDifference(in_layers=[prev_layer, labels])
		self.set_loss(mse)
		else:
		# TODO(rbharath): Add in support for additional
		# losses.
		raise ValueError("Unsupported loss.")

		super(Sequential, self).fit(dataset, **kwargs)

		def restore(self, checkpoint=None):
		"""Not currently supported.
		"""
		# TODO(rbharath): The TensorGraph can't be built until
		# fit is called since the shapes of features/labels
		# not specified. Need to figure out a good restoration
		# method for this use case.
		raise ValueError("Restore is not yet supported " "for sequential models.")

deepchem/models/tensorgraph/tests/test_sequential.py

0 → 100644

+50 −0

Original line number	Diff line number	Diff line
		import unittest
		import numpy as np
		import deepchem as dc
		from deepchem.models.tensorgraph.layers import Dense
		from deepchem.models.tensorgraph.layers import SoftMax
		from nose.tools import assert_true


		class TestSequential(unittest.TestCase):
		"""
		Test that sequential graphs work correctly.
		"""

		def test_single_task_classifier(self):
		n_data_points = 20
		n_features = 2
		X = np.random.rand(n_data_points, n_features)
		y = [[0, 1] for x in range(n_data_points)]
		dataset = dc.data.NumpyDataset(X, y)
		model = dc.models.Sequential(learning_rate=0.01)
		model.add(Dense(out_channels=2))
		model.add(SoftMax())
		model.fit(dataset, loss="binary_crossentropy", nb_epoch=1000)
		prediction = np.squeeze(model.predict_on_batch(X))
		assert_true(np.all(np.isclose(prediction, y, atol=0.4)))

		def test_fit_twice(self):
		n_data_points = 20
		n_features = 2
		X = np.random.rand(n_data_points, n_features)
		y = [[0, 1] for x in range(n_data_points)]
		dataset = dc.data.NumpyDataset(X, y)
		model = dc.models.Sequential(learning_rate=0.01)
		model.add(Dense(out_channels=2))
		model.add(SoftMax())
		# Should be able to call fit twice without failure.
		model.fit(dataset, loss="binary_crossentropy", nb_epoch=1000)
		model.fit(dataset, loss="binary_crossentropy", nb_epoch=1000)

		def test_single_task_regressor(self):
		n_data_points = 20
		n_features = 2
		X = np.random.rand(n_data_points, n_features)
		y = [0.5 for x in range(n_data_points)]
		dataset = dc.data.NumpyDataset(X, y)
		model = dc.models.Sequential(learning_rate=0.01)
		model.add(Dense(out_channels=1))
		model.fit(dataset, loss="mse", nb_epoch=1000)
		prediction = np.squeeze(model.predict_on_batch(X))
		assert_true(np.all(np.isclose(prediction, y, atol=3.0)))

Admin message