Update branch (ee9fbe2f) · Commits · 钟慕尧 / deepchem

.gitignore

+4 −0

Original line number	Diff line number	Diff line
		@@ -63,3 +63,7 @@ target/
		# IDE files
		.idea
		*.iml

		# Vim swap
		*.swp

.travis.yml

+2 −2

Original line number	Diff line number	Diff line
		@@ -15,7 +15,7 @@ install:
		- conda config --add channels http://conda.binstar.org/omnia
		- bash scripts/install_deepchem_conda.sh deepchem
		- source activate deepchem
		- pip install yapf==0.20.0
		- pip install yapf==0.22.0
		- pip install coveralls
		- python setup.py install
		script:

Dockerfile

+8 −17

Original line number	Diff line number	Diff line
		FROM nvidia/cuda
		FROM nvidia/cuda:9.0-cudnn7-runtime

		# Install some utilities
		RUN apt-get update && \
		apt-get install -y -q wget git libxrender1 libsm6 && \
		apt-get install -y -q wget git libxrender1 libsm6 bzip2 && \
		apt-get clean

		# Install miniconda
		RUN MINICONDA="Miniconda2-latest-Linux-x86_64.sh" && \
		RUN MINICONDA="Miniconda3-latest-Linux-x86_64.sh" && \
		wget --quiet https://repo.continuum.io/miniconda/$MINICONDA && \
		bash $MINICONDA -b -p /miniconda && \
		rm -f $MINICONDA
		ENV PATH /miniconda/bin:$PATH

		# Install deepchem conda package from omnia
		# TODO: Uncomment this when there is a stable release of deepchem.
		#RUN conda config --add channels omnia
		#RUN conda install --yes deepchem

		# Install deepchem with GPU support from github at the 2.0.0 release
		# TODO: Get rid of this when there is a stable release of deepchem.
		RUN git clone https://github.com/deepchem/deepchem.git && \
		RUN conda update -n base conda
		RUN export LANG=en_US.UTF-8 && \
		git clone https://github.com/deepchem/deepchem.git && \
		cd deepchem && \
		git checkout tags/1.3.1 && \
		git checkout 2.0.0 && \
		sed -i -- 's/tensorflow$/tensorflow-gpu/g' scripts/install_deepchem_conda.sh && \
		bash scripts/install_deepchem_conda.sh root && \
		bash scripts/install_deepchem_conda.sh && \
		python setup.py develop

		# Clean up
		RUN cd deepchem && \
		git clean -fX

		# Run tests
		#RUN pip install nose && \
		# nosetests -v deepchem --nologcapture

README.md

+5 −4

Original line number	Diff line number	Diff line
		@@ -59,12 +59,13 @@ git clone https://github.com/deepchem/deepchem.git # Clone deepchem source
		cd deepchem
		bash scripts/install_deepchem_conda.sh deepchem
		source activate deepchem
		yes \| pip install tensorflow-gpu==1.5.0 # If you want GPU support
		yes \| pip install tensorflow-gpu==1.6.0 # If you want GPU support
		python setup.py install # Manual install
		nosetests -a '!slow' -v deepchem --nologcapture # Run tests
		```
		This creates a new conda environment `deepchem` and installs in it the dependencies that
		are needed. To access it, use the `source activate deepchem` command.
		are needed. To access it, run `conda activate deepchem` if your conda version is >= 4.4, or `source activate deepchem` if your conda version is < 4.4.

		Check [this link](https://conda.io/docs/using/envs.html) for more information about
		the benefits and usage of conda environments. Warning: Segmentation faults can [still happen](https://github.com/deepchem/deepchem/pull/379#issuecomment-277013514)
		via this installation procedure.
		@@ -72,7 +73,7 @@ via this installation procedure.
		### Easy Install via Conda

		```bash
		conda install -c deepchem -c rdkit -c conda-forge -c omnia deepchem=1.3.1
		conda install -c deepchem -c rdkit -c conda-forge -c omnia deepchem=2.0.0
		```
		Note: `Easy Install` installs the latest stable version of `deepchem` and _does not install from source_. If you need to install from source make sure you follow the steps [here](#using-a-conda-environment).

		@@ -182,4 +183,4 @@ DeepChem is supported by a number of corporate partners who use DeepChem to solv


		## Version
		1.3.1
		2.0.0

contrib/laplacian/petroskisuch.py

0 → 100644

+165 −0

Original line number	Diff line number	Diff line
		import collections

		import numpy as np
		import six
		import tensorflow as tf

		from deepchem.data import NumpyDataset
		from deepchem.feat.graph_features import ConvMolFeaturizer
		from deepchem.feat.mol_graphs import ConvMol
		from deepchem.metrics import to_one_hot
		from deepchem.models.tensorgraph.graph_layers import WeaveGather, \
		DTNNEmbedding, DTNNStep, DTNNGather, DAGLayer, \
		DAGGather, DTNNExtract, MessagePassing, SetGather
		from deepchem.models.tensorgraph.graph_layers import WeaveLayerFactory
		from deepchem.models.tensorgraph.layers import Dense, SoftMax, \
		SoftMaxCrossEntropy, GraphConv, BatchNorm, \
		GraphPool, GraphGather, WeightedError, Dropout, BatchNorm, Stack, Flatten, GraphCNN, GraphCNNPool
		from deepchem.models.tensorgraph.layers import L2Loss, Label, Weights, Feature
		from deepchem.models.tensorgraph.tensor_graph import TensorGraph
		from deepchem.trans import undo_transforms


		class PetroskiSuchModel(TensorGraph):
		    """Graph CNN model with pooled vertex representations.

		    Model from "Robust Spatial Filtering with Graph Convolutional Neural
		    Networks", https://arxiv.org/abs/1703.00792

		    The graph built here stacks two GraphCNN layers, a GraphCNNPool down to
		    32 vertices, a third GraphCNN layer, a GraphCNNPool down to 8 vertices,
		    and a 256-unit dense readout that feeds one output head per task.
		    """

		    def __init__(self,
		                 n_tasks,
		                 max_atoms=200,
		                 dropout=0.0,
		                 mode="classification",
		                 **kwargs):
		        """
		        Parameters
		        ----------
		        n_tasks: int
		            Number of tasks
		        max_atoms: int
		            Size of the atom axis of the vertex-feature, adjacency and mask
		            inputs.
		        dropout: float
		            Value handed to every Dropout layer in the graph.
		        mode: str
		            Either "classification" or "regression"
		        kwargs:
		            Forwarded to the TensorGraph constructor. 'use_queue' is always
		            overridden to False; a truthy 'error_bars' entry is additionally
		            recorded on the instance as self.error_bars.

		        Raises
		        ------
		        ValueError
		            If mode is neither "classification" nor "regression".
		        """
		        # Fail early: with any other mode build_graph would create no output
		        # heads and then crash on an unbound local.
		        if mode not in ("classification", "regression"):
		            raise ValueError(
		                'mode must be "classification" or "regression", got %r' %
		                (mode,))
		        self.n_tasks = n_tasks
		        self.mode = mode
		        self.max_atoms = max_atoms
		        self.error_bars = bool(kwargs.get('error_bars'))
		        self.dropout = dropout
		        kwargs['use_queue'] = False
		        super(PetroskiSuchModel, self).__init__(**kwargs)
		        self.build_graph()

		    def build_graph(self):
		        """Create the input features, the layer stack, outputs and the loss.

		        Populates self.vertex_features, self.adj_matrix, self.mask,
		        self.my_labels (one Label per task) and self.my_task_weights, registers
		        one output per task and sets a WeightedError loss over the stacked
		        per-task costs.
		        """
		        self.vertex_features = Feature(shape=(None, self.max_atoms, 75))
		        self.adj_matrix = Feature(
		            shape=(None, self.max_atoms, 1, self.max_atoms))
		        self.mask = Feature(shape=(None, self.max_atoms, 1))

		        gcnn1 = BatchNorm(
		            GraphCNN(
		                num_filters=64,
		                in_layers=[self.vertex_features, self.adj_matrix, self.mask]))
		        gcnn1 = Dropout(self.dropout, in_layers=gcnn1)
		        gcnn2 = BatchNorm(
		            GraphCNN(
		                num_filters=64,
		                in_layers=[gcnn1, self.adj_matrix, self.mask]))
		        gcnn2 = Dropout(self.dropout, in_layers=gcnn2)

		        # The pooling layer yields both pooled features and a matching
		        # adjacency matrix for the reduced vertex set.
		        gc_pool, adj_matrix = GraphCNNPool(
		            num_vertices=32, in_layers=[gcnn2, self.adj_matrix, self.mask])
		        gc_pool = BatchNorm(gc_pool)
		        gc_pool = Dropout(self.dropout, in_layers=gc_pool)
		        gcnn3 = BatchNorm(
		            GraphCNN(num_filters=32, in_layers=[gc_pool, adj_matrix]))
		        gcnn3 = Dropout(self.dropout, in_layers=gcnn3)

		        # The adjacency matrix of the last pooling step is not used further.
		        gc_pool2, _ = GraphCNNPool(
		            num_vertices=8, in_layers=[gcnn3, adj_matrix])
		        gc_pool2 = BatchNorm(gc_pool2)
		        gc_pool2 = Dropout(self.dropout, in_layers=gc_pool2)
		        flattened = Flatten(in_layers=gc_pool2)
		        readout = Dense(
		            out_channels=256, activation_fn=tf.nn.relu, in_layers=flattened)

		        costs = []
		        self.my_labels = []
		        for _task in range(self.n_tasks):
		            if self.mode == 'classification':
		                classification = Dense(
		                    out_channels=2, activation_fn=None, in_layers=[readout])
		                softmax = SoftMax(in_layers=[classification])
		                self.add_output(softmax)

		                label = Label(shape=(None, 2))
		                self.my_labels.append(label)
		                costs.append(
		                    SoftMaxCrossEntropy(in_layers=[label, classification]))
		            elif self.mode == 'regression':
		                regression = Dense(
		                    out_channels=1, activation_fn=None, in_layers=[readout])
		                self.add_output(regression)

		                label = Label(shape=(None, 1))
		                self.my_labels.append(label)
		                costs.append(L2Loss(in_layers=[label, regression]))

		        if self.mode == "classification":
		            entropy = Stack(in_layers=costs, axis=-1)
		        elif self.mode == "regression":
		            entropy = Stack(in_layers=costs, axis=1)
		        else:
		            raise ValueError(
		                'mode must be "classification" or "regression", got %r' %
		                (self.mode,))
		        self.my_task_weights = Weights(shape=(None, self.n_tasks))
		        loss = WeightedError(in_layers=[entropy, self.my_task_weights])
		        self.set_loss(loss)

		    def default_generator(self,
		                          dataset,
		                          epochs=1,
		                          predict=False,
		                          deterministic=True,
		                          pad_batches=True):
		        """Yield one feed dict per batch of `dataset`, for `epochs` passes.

		        Each sample in a batch is indexed as sample[0] (fed to the adjacency
		        input), sample[1] (fed to the vertex-feature input) and sample[2]
		        (number of leading atoms to mark as present in the mask).

		        Parameters
		        ----------
		        dataset:
		            Object providing iterbatches(batch_size, pad_batches=...,
		            deterministic=...) that yields (X, y, w, ids) tuples.
		        epochs: int
		            Number of passes over the dataset.
		        predict: bool
		            When False, a 'Starting epoch' line is printed for every epoch.
		        deterministic: bool
		            Forwarded to dataset.iterbatches.
		        pad_batches: bool
		            NOTE(review): accepted but not used; batches are always requested
		            with pad_batches=True, and the mask below is sized with
		            self.batch_size accordingly. Confirm before honouring it.

		        Yields
		        ------
		        dict
		            Maps the label, weight, adjacency, vertex-feature and mask layers
		            to numpy arrays for one batch.
		        """
		        for epoch in range(epochs):
		            if not predict:
		                print('Starting epoch %i' % epoch)
		            batches = dataset.iterbatches(
		                self.batch_size, pad_batches=True, deterministic=deterministic)
		            for X_b, y_b, w_b, ids_b in batches:
		                d = {}
		                for index, label in enumerate(self.my_labels):
		                    if self.mode == 'classification':
		                        d[label] = to_one_hot(y_b[:, index])
		                    if self.mode == 'regression':
		                        d[label] = np.expand_dims(y_b[:, index], -1)
		                d[self.my_task_weights] = w_b
		                d[self.adj_matrix] = np.expand_dims(
		                    np.array([x[0] for x in X_b]), -2)
		                d[self.vertex_features] = np.array([x[1] for x in X_b])

		                mask = np.zeros(shape=(self.batch_size, self.max_atoms, 1))
		                for i in range(self.batch_size):
		                    mask_size = X_b[i][2]
		                    # Mark the first mask_size atoms of sample i as present.
		                    # The earlier chained form mask[i][:mask_size][0] = 1
		                    # only ever set the entry of atom 0.
		                    mask[i, :mask_size, 0] = 1
		                d[self.mask] = mask
		                yield d

		    def predict_proba_on_generator(self, generator, transformers=None):
		        """Run the model outputs on every feed dict produced by `generator`.

		        Parameters
		        ----------
		        generator:
		            Iterable of dicts keyed by layer objects, e.g. the result of
		            default_generator.
		        transformers: list, optional
		            When non-empty, each batch result is passed through
		            undo_transforms with these transformers.

		        Returns
		        -------
		        numpy.ndarray
		            Per-batch results concatenated along axis 0. Results with three
		            dimensions are transposed with axes [1, 0, 2] before
		            concatenation.
		        """
		        if transformers is None:
		            transformers = []
		        if not self.built:
		            self.build()
		        with self._get_tf("Graph").as_default():
		            out_tensors = [x.out_tensor for x in self.outputs]
		            results = []
		            for feed_dict in generator:
		                # Re-key from layer objects to the tensors of the built graph.
		                feed_dict = {
		                    self.layers[k.name].out_tensor: v
		                    for k, v in feed_dict.items()
		                }
		                # NOTE(review): the training placeholder is fed 1.0 while
		                # predicting; presumably this keeps training-mode behaviour
		                # active on purpose -- confirm.
		                feed_dict[self._training_placeholder] = 1.0
		                result = np.array(
		                    self.session.run(out_tensors, feed_dict=feed_dict))
		                if len(result.shape) == 3:
		                    result = np.transpose(result, axes=[1, 0, 2])
		                if len(transformers) > 0:
		                    result = undo_transforms(result, transformers)
		                results.append(result)
		            return np.concatenate(results, axis=0)

		    def evaluate(self,
		                 dataset,
		                 metrics,
		                 transformers=None,
		                 per_task_metrics=False):
		        """Evaluate `metrics` on `dataset` through evaluate_generator.

		        Parameters
		        ----------
		        dataset:
		            Dataset handed to default_generator with predict=True.
		        metrics:
		            Forwarded unchanged to evaluate_generator.
		        transformers: list, optional
		            NOTE(review): accepted but not forwarded to evaluate_generator;
		            confirm whether metrics are meant to be computed on
		            untransformed values.
		        per_task_metrics: bool
		            Forwarded unchanged to evaluate_generator.

		        Returns
		        -------
		        Whatever evaluate_generator returns.
		        """
		        if not self.built:
		            self.build()
		        return self.evaluate_generator(
		            self.default_generator(dataset, predict=True),
		            metrics,
		            labels=self.my_labels,
		            weights=[self.my_task_weights],
		            per_task_metrics=per_task_metrics)

Admin message