Source code for beyondml.tflow.layers.MultiMaskedDense

import numpy as np
import tensorflow as tf
from tensorflow.keras.layers import Layer


class MultiMaskedDense(Layer):
    """
    Masked multitask fully connected layer.

    This layer implements multiple stacks of the fully-connected architecture
    and implements masking with the BeyondML API to support developing sparse
    multitask models.

    The layer is called on a list of inputs and returns a list of outputs of
    the same length. Input ``i`` is multiplied by its own slice of the kernel
    (``self.w[i]``) after that slice has been multiplied elementwise by the
    matching slice of the non-trainable mask (``self.w_mask[i]``).
    """

    def __init__(
        self,
        units,
        use_bias=True,
        activation=None,
        kernel_initializer='random_normal',
        mask_initializer='ones',
        bias_initializer='zeros',
        **kwargs
    ):
        """
        Parameters
        ----------
        units : int
            The number of artificial neurons to use
        use_bias : bool (default True)
            Whether to use a bias calculation in the outputs
        activation : None, str, or function (default None)
            The activation function to use on the outputs
        kernel_initializer : str or keras initialization function (default 'random_normal')
            The weight initialization function to use
        mask_initializer : str or keras initialization function (default 'ones')
            The mask initialization function to use
        bias_initializer : str or keras initialization function (default 'zeros')
            The bias initialization function to use
        **kwargs
            Forwarded unchanged to the base ``Layer`` constructor
        """
        super(MultiMaskedDense, self).__init__(**kwargs)
        # Values that are not already ints (e.g. numpy integers) are coerced.
        self.units = int(units) if not isinstance(units, int) else units
        self.use_bias = use_bias
        self.activation = tf.keras.activations.get(activation)
        self.kernel_initializer = tf.keras.initializers.get(kernel_initializer)
        self.mask_initializer = tf.keras.initializers.get(mask_initializer)
        self.bias_initializer = tf.keras.initializers.get(bias_initializer)

    def build(self, input_shape):
        """
        Build the layer in preparation to be trained or called. Should not be
        called directly, but rather is called when the layer is added to a
        model

        Parameters
        ----------
        input_shape : list of shapes
            One shape per input. Only the last dimension of the first shape
            is used to size the kernel, so every input is assumed to share
            that last dimension.
        """
        try:
            input_shape = [
                tuple(shape.as_list()) for shape in input_shape
            ]
        except AttributeError:
            # Sometimes, input shapes come as tuples already
            pass
        simplified_shape = input_shape[0]

        # One (input_dim, units) kernel per input, stacked on the first axis.
        self.w = self.add_weight(
            shape=(len(input_shape), simplified_shape[-1], self.units),
            initializer=self.kernel_initializer,
            trainable=True,
            name='weights'
        )
        self.w_mask = self.add_weight(
            shape=self.w.shape,
            initializer=self.mask_initializer,
            trainable=False,
            name='weights_mask'
        )

        if self.use_bias:
            # One bias vector per input, with a mask of the same shape.
            self.b = self.add_weight(
                shape=(len(input_shape), self.units),
                initializer=self.bias_initializer,
                trainable=True,
                name='bias'
            )
            self.b_mask = self.add_weight(
                shape=self.b.shape,
                initializer=self.mask_initializer,
                trainable=False,
                name='bias_mask'
            )

    def call(self, inputs):
        """
        This is where the layer's logic lives and is called upon inputs

        Parameters
        ----------
        inputs : list of TensorFlow Tensors or Tensor-likes
            The inputs to the layer, one per stack

        Returns
        -------
        outputs : list of TensorFlow Tensors
            The outputs of the layer's logic, one per input
        """
        # Index-based access is kept deliberately: it only requires
        # ``len`` and ``__getitem__`` on ``inputs``, exactly as before.
        output_tensor = [
            tf.matmul(inputs[i], self.w[i] * self.w_mask[i])
            for i in range(len(inputs))
        ]
        if self.use_bias:
            output_tensor = [
                output_tensor[i] + (self.b[i] * self.b_mask[i])
                for i in range(len(output_tensor))
            ]
        return [self.activation(tensor) for tensor in output_tensor]

    def get_config(self):
        """
        Return the layer configuration: the base layer config extended with
        this layer's constructor arguments in serialized form.
        """
        config = super().get_config().copy()
        config.update(
            {
                'units': self.units,
                'use_bias': self.use_bias,
                'activation': tf.keras.activations.serialize(self.activation),
                'kernel_initializer': tf.keras.initializers.serialize(self.kernel_initializer),
                'mask_initializer': tf.keras.initializers.serialize(self.mask_initializer),
                'bias_initializer': tf.keras.initializers.serialize(self.bias_initializer)
            }
        )
        return config

    def set_masks(self, new_masks):
        """
        Set the masks for the layer

        The current kernel (and bias, when used) is multiplied by the new
        mask before being written back, so masked positions are zeroed in the
        stored weights as well as in the mask.

        Parameters
        ----------
        new_masks : list of arrays or array-likes
            The new masks to set for the layer. ``new_masks[0]`` is the
            kernel mask; ``new_masks[1]`` is the bias mask and is only read
            when the layer uses a bias.
        """
        # np.asarray accepts lists/tuples as well as arrays, which ``.astype``
        # on the raw argument did not.
        weight_mask = np.asarray(new_masks[0], dtype=np.float32)
        if not self.use_bias:
            self.set_weights([self.w.numpy() * weight_mask, weight_mask])
        else:
            bias_mask = np.asarray(new_masks[1], dtype=np.float32)
            # NOTE(review): order is kernel, bias, kernel mask, bias mask --
            # presumably trainable weights precede non-trainable ones in
            # ``self.weights``; confirm against the Keras version in use.
            self.set_weights(
                [
                    self.w.numpy() * weight_mask,
                    self.b.numpy() * bias_mask,
                    weight_mask,
                    bias_mask,
                ]
            )

    @classmethod
    def from_config(cls, config):
        """
        Create a layer from a configuration dictionary.

        Parameters
        ----------
        config : dict
            A configuration as produced by ``get_config``

        Returns
        -------
        layer : MultiMaskedDense
            A new, unbuilt layer
        """
        # Forward the whole config so the base-layer entries written by
        # get_config (e.g. the layer name) reach the constructor through
        # **kwargs instead of being silently discarded.
        return cls(**config)