First linear layer (eb7a2f48) · Commits · 钟慕尧 / deepchem

deepchem/models/jax_models/layers.py

0 → 100644

+103 −0

Original line number	Diff line number	Diff line
		import math
		import numpy as np
		import logging
		try:
		import jax.numpy as jnp
		import jax
		import haiku as hk
		except:
		raise ImportError('These classes require Jax and Haiku to be installed.')

		logger = logging.getLogger(__name__)


		class Linear(hk.Module):
		"""Protein folding specific Linear Module.

		This differs from the standard Haiku Linear in a few ways:
		* It supports inputs of arbitrary rank
		* Initializers are specified by strings

		This code is adapted from DeepMind's AlphaFold code release
		(https://github.com/deepmind/alphafold).

		Examples
		--------
		>>> import deepchem as dc
		>>> import haiku as hk
		>>> import deepchem.models.jax_models.layers
		>>> def forward_model(x):
		... layer = dc.models.jax_models.layers.Linear(2)
		... return layer(x)
		>>> f = hk.transform(forward_model)
		>>> rng = jax.random.PRNGKey(42)
		>>> x = jnp.ones([8, 28 * 28])
		>>> params = f.init(rng, x)
		>>> output = f.apply(params, rng, x)
		"""

		def __init__(self,
		num_output: int,
		initializer: str = 'linear',
		use_bias: bool = True,
		bias_init: float = 0.,
		name: str = 'linear'):
		"""Constructs Linear Module.

		Parameters
		----------
		num_output: int
		number of output channels.
		initializer: str (default 'linear')
		What initializer to use, should be one of {'linear', 'relu', 'zeros'}
		use_bias: bool (default True)
		Whether to include trainable bias
		bias_init: float (default 0)
		Value used to initialize bias.
		name: str (default 'linear')
		name of module, used for name scopes.
		"""

		super().__init__(name=name)
		self.num_output = num_output
		self.initializer = initializer
		self.use_bias = use_bias
		self.bias_init = bias_init

		def __call__(self, inputs: jnp.ndarray) -> jnp.ndarray:
		"""Connects Module.

		Parameters
		----------
		inputs: jnp.ndarray
		Tensor of shape [..., num_channel]

		Returns
		-------
		output of shape [..., num_output]
		"""
		n_channels = int(inputs.shape[-1])

		weight_shape = [n_channels, self.num_output]
		if self.initializer == 'linear':
		weight_init = hk.initializers.VarianceScaling(mode='fan_in', scale=1.)
		elif self.initializer == 'relu':
		weight_init = hk.initializers.VarianceScaling(mode='fan_in', scale=2.)
		elif self.initializer == 'zeros':
		weight_init = hk.initializers.Constant(0.0)

		weights = hk.get_parameter('weights', weight_shape, inputs.dtype,
		weight_init)

		# this is equivalent to einsum('...c,cd->...d', inputs, weights)
		# but turns out to be slightly faster
		inputs = jnp.swapaxes(inputs, -1, -2)
		output = jnp.einsum('...cb,cd->...db', inputs, weights)
		output = jnp.swapaxes(output, -1, -2)

		if self.use_bias:
		bias = hk.get_parameter('bias', [self.num_output], inputs.dtype,
		hk.initializers.Constant(self.bias_init))
		output += bias

		return output

deepchem/models/jax_models/tests/test_layers.py

0 → 100644

+29 −0

Original line number	Diff line number	Diff line
		import pytest
		import deepchem as dc
		import numpy as np

		try:
		import jax
		import jax.numpy as jnp
		from jax import random
		import haiku as hk
		except:
		has_haiku_and_optax = False


		@pytest.mark.jax
		def test_linear():
		import deepchem as dc
		import haiku as hk
		import deepchem.models.jax_models.layers

		def forward(x):
		layer = dc.models.jax_models.layers.Linear(2)
		return layer(x)

		forward = hk.transform(forward)
		rng = jax.random.PRNGKey(42)
		x = jnp.ones([8, 28 * 28])
		params = forward.init(rng, x)
		output = forward.apply(params, rng, x)
		assert output.shape == (8, 2)

Admin message