# Source code for ztlearn.initializers

# -*- coding: utf-8 -*-

import numpy as np

class WeightInitializer:
    """Base class for weight initializers; supplies the shared fan computation."""

    def compute_fans(self, shape):
        """
        Compute the ``(fan_in, fan_out)`` pair for a weight shape.

        Original code forked from MIT licensed keras project.

        Args:
            shape: sequence of dimension sizes. A one-element shape ``(n,)``
                is treated as ``(n, 1)``.

        Returns:
            tuple: ``(fan_in, fan_out)`` where ``fan_in`` is
            ``shape[1] * receptive_field_size`` and ``fan_out`` is
            ``shape[0] * receptive_field_size``.
        """
        # kernel shape: ('NF': Total Filters, 'CF': Filter Channels,
        #                'HF': Filter Height 'WF': Filter Width)
        shape = (shape[0], 1) if len(shape) == 1 else shape

        # NOTE(review): the slice is kept as ``[:2]`` (product of the first
        # two dimensions) exactly as it appears in this file. The upstream
        # Keras helper uses ``shape[2:]`` (the spatial dimensions) for this
        # layout -- confirm which one is intended before changing it, since
        # it alters the scale of every initializer.
        receptive_field_size = np.prod(shape[:2])

        fan_out = shape[0] * receptive_field_size  # NF * receptive_field_size
        fan_in = shape[1] * receptive_field_size  # CF * receptive_field_size

        return fan_in, fan_out
class HeNormal(WeightInitializer):
    """
    **He Normal (HeNormal)**

    Gaussian variant of He initialization, a scheme designed with rectifier
    nonlinearities in mind. Samples come from a zero-mean normal distribution
    whose standard deviation is ``sqrt(2 / fan_in)``.

    References:
        [1] Delving Deep into Rectifiers: Surpassing Human-Level Performance on ImageNet Classification
            * [Kaiming He, 2015]
            * [PDF]

        [2] Initialization Of Deep Networks Case of Rectifiers
            * [DeepGrid Article - Jefkine Kafunah]
    """

    def weights(self, shape, random_seed):
        """
        Sample a weight array of the requested shape.

        Args:
            shape: shape of the array to generate.
            random_seed: value handed to ``np.random.seed`` before sampling
                (this reseeds NumPy's global random state).

        Returns:
            Array of normally distributed values with size ``shape``.
        """
        fan_in, _ = self.compute_fans(shape)
        std = np.sqrt(2. / fan_in)

        np.random.seed(random_seed)
        return np.random.normal(0.0, std, shape)

    @property
    def init_name(self):
        """Name of the concrete initializer class."""
        return type(self).__name__
class HeUniform(WeightInitializer):
    """
    **He Uniform (HeUniform)**

    HeUniform is a robust initialization method that particularly considers
    the rectifier nonlinearities. He uniform is an implementation based on
    Uniform distribution: samples are drawn from ``[-limit, limit)`` with
    ``limit = sqrt(6 / fan_in)``.

    References:
        [1] Delving Deep into Rectifiers: Surpassing Human-Level Performance on ImageNet Classification
            * [Kaiming He, 2015]
            * [PDF]

        [2] Initialization Of Deep Networks Case of Rectifiers
            * [DeepGrid Article - Jefkine Kafunah]
    """

    def weights(self, shape, random_seed):
        """
        Sample a weight array of the requested shape.

        Args:
            shape: shape of the array to generate.
            random_seed: value handed to ``np.random.seed`` before sampling
                (this reseeds NumPy's global random state).

        Returns:
            Array of uniformly distributed values with size ``shape``.
        """
        fan_in, fan_out = self.compute_fans(shape)
        scale = np.sqrt(6. / fan_in)

        np.random.seed(random_seed)
        return np.random.uniform(low=-scale, high=scale, size=shape)

    @property
    def init_name(self):
        """Name of the concrete initializer class."""
        return self.__class__.__name__
class GlorotNormal(WeightInitializer):
    """
    **Glorot Normal (GlorotNormal)**

    Gaussian variant of Glorot initialization (more famously known as Xavier
    initialization), which tries to maintain the same variance of the weight
    gradients across all layers. Samples come from a zero-mean normal
    distribution whose standard deviation is ``sqrt(2 / (fan_in + fan_out))``.

    References:
        [1] Understanding the difficulty of training deep feedforward neural networks
            * [Xavier Glorot, 2010]
            * [PDF]

        [2] Initialization Of Deep Feedforward Networks
            * [DeepGrid Article - Jefkine Kafunah]
    """

    def weights(self, shape, random_seed):
        """
        Sample a weight array of the requested shape.

        Args:
            shape: shape of the array to generate.
            random_seed: value handed to ``np.random.seed`` before sampling
                (this reseeds NumPy's global random state).

        Returns:
            Array of normally distributed values with size ``shape``.
        """
        fan_in, fan_out = self.compute_fans(shape)
        fan_total = fan_in + fan_out
        std = np.sqrt(2. / fan_total)

        np.random.seed(random_seed)
        return np.random.normal(0.0, std, shape)

    @property
    def init_name(self):
        """Name of the concrete initializer class."""
        return type(self).__name__
class GlorotUniform(WeightInitializer):
    """
    **Glorot Uniform (GlorotUniform)**

    Uniform variant of Glorot initialization (more famously known as Xavier
    initialization), which tries to maintain the same variance of the weight
    gradients across all layers. Samples are drawn from ``[-limit, limit)``
    with ``limit = sqrt(6 / (fan_in + fan_out))``.

    References:
        [1] Understanding the difficulty of training deep feedforward neural networks
            * [Xavier Glorot, 2010]
            * [PDF]

        [2] Initialization Of Deep Feedforward Networks
            * [DeepGrid Article - Jefkine Kafunah]
    """

    def weights(self, shape, random_seed):
        """
        Sample a weight array of the requested shape.

        Args:
            shape: shape of the array to generate.
            random_seed: value handed to ``np.random.seed`` before sampling
                (this reseeds NumPy's global random state).

        Returns:
            Array of uniformly distributed values with size ``shape``.
        """
        fan_in, fan_out = self.compute_fans(shape)
        fan_total = fan_in + fan_out
        limit = np.sqrt(6. / fan_total)

        np.random.seed(random_seed)
        return np.random.uniform(-limit, limit, shape)

    @property
    def init_name(self):
        """Name of the concrete initializer class."""
        return type(self).__name__
class LeCunUniform(WeightInitializer):
    """
    **LeCun Uniform (LeCunUniform)**

    Weights are chosen randomly, but in such a way that the sigmoid is
    primarily activated in its linear region. This is the Uniform-distribution
    variant: samples are drawn from ``[-limit, limit)`` with
    ``limit = sqrt(3 / fan_in)``.

    References:
        [1] Efficient Backprop
            * [LeCun, 1998]
            * [PDF]
    """

    def weights(self, shape, random_seed):
        """
        Sample a weight array of the requested shape.

        Args:
            shape: shape of the array to generate.
            random_seed: value handed to ``np.random.seed`` before sampling
                (this reseeds NumPy's global random state).

        Returns:
            Array of uniformly distributed values with size ``shape``.
        """
        fan_in, _ = self.compute_fans(shape)
        limit = np.sqrt(3. / fan_in)

        np.random.seed(random_seed)
        return np.random.uniform(-limit, limit, shape)

    @property
    def init_name(self):
        """Name of the concrete initializer class."""
        return type(self).__name__
class LeCunNormal(WeightInitializer):
    """
    **LeCun Normal (LeCunNormal)**

    Weights should be randomly chosen but in such a way that the sigmoid is
    primarily activated in its linear region. LeCun normal is an
    implementation based on Gaussian distribution: samples come from a
    zero-mean normal distribution with standard deviation ``sqrt(1 / fan_in)``.

    References:
        [1] Efficient Backprop
            * [LeCun, 1998]
            * [PDF]
    """

    def weights(self, shape, random_seed):
        """
        Sample a weight array of the requested shape.

        Args:
            shape: shape of the array to generate.
            random_seed: value handed to ``np.random.seed`` before sampling
                (this reseeds NumPy's global random state).

        Returns:
            Array of normally distributed values with size ``shape``.
        """
        fan_in, fan_out = self.compute_fans(shape)
        scale = np.sqrt(1. / fan_in)

        np.random.seed(random_seed)
        # np.random.normal is parameterized by loc/scale; the previous
        # low/high keywords belong to np.random.uniform and raised TypeError.
        return np.random.normal(loc=0.0, scale=scale, size=shape)

    @property
    def init_name(self):
        """Name of the concrete initializer class."""
        return self.__class__.__name__
class RandomUniform(WeightInitializer):
    """
    **Random Uniform (RandomUniform)**

    Weight initialization based on the Uniform distribution: samples are
    drawn from ``[-limit, limit)`` with ``limit = sqrt(1 / (fan_in + fan_out))``.
    """

    def weights(self, shape, random_seed):
        """
        Sample a weight array of the requested shape.

        Args:
            shape: shape of the array to generate.
            random_seed: value handed to ``np.random.seed`` before sampling
                (this reseeds NumPy's global random state).

        Returns:
            Array of uniformly distributed values with size ``shape``.
        """
        fan_in, fan_out = self.compute_fans(shape)
        fan_total = fan_in + fan_out
        limit = np.sqrt(1. / fan_total)

        np.random.seed(random_seed)
        return np.random.uniform(-limit, limit, shape)

    @property
    def init_name(self):
        """Name of the concrete initializer class."""
        return type(self).__name__
class RandomNormal(WeightInitializer):
    """
    **Random Normal (RandomNormal)**

    Weight initialization based on the Gaussian distribution: samples come
    from a zero-mean normal distribution with standard deviation
    ``sqrt(1 / (fan_in + fan_out))``.
    """

    def weights(self, shape, random_seed):
        """
        Sample a weight array of the requested shape.

        Args:
            shape: shape of the array to generate.
            random_seed: value handed to ``np.random.seed`` before sampling
                (this reseeds NumPy's global random state).

        Returns:
            Array of normally distributed values with size ``shape``.
        """
        fan_in, fan_out = self.compute_fans(shape)
        fan_total = fan_in + fan_out
        std = np.sqrt(1. / fan_total)

        np.random.seed(random_seed)
        return np.random.normal(0.0, std, shape)

    @property
    def init_name(self):
        """Name of the concrete initializer class."""
        return type(self).__name__
class Zero(WeightInitializer):
    """
    **Zero (Zero)**

    Weight initialization that produces an array filled with zeros.
    """

    def weights(self, shape, random_seed):
        """
        Build an all-zeros array.

        Args:
            shape: shape of the array to generate.
            random_seed: accepted for interface parity with the other
                initializers; not used here.

        Returns:
            Array of zeros with the given ``shape``.
        """
        return np.zeros(shape)

    @property
    def init_name(self):
        """Name of the concrete initializer class."""
        return type(self).__name__
class One(WeightInitializer):
    """
    **One (One)**

    Weight initialization that produces an array filled with ones.
    """

    def weights(self, shape, random_seed):
        """
        Build an all-ones array.

        Args:
            shape: shape of the array to generate.
            random_seed: accepted for interface parity with the other
                initializers; not used here.

        Returns:
            Array of ones with the given ``shape``.
        """
        return np.ones(shape)

    @property
    def init_name(self):
        """Name of the concrete initializer class."""
        return type(self).__name__
class Identity(WeightInitializer):
    """
    **Identity (Identity)**

    Weight initialization that produces an identity-style matrix: ones on
    the main diagonal and zeros elsewhere.
    """

    def weights(self, shape, random_seed):
        """
        Build a ``float32`` matrix via ``np.eye``.

        Args:
            shape: indexable whose first two entries give the number of rows
                and columns; any further entries are ignored.
            random_seed: accepted for interface parity with the other
                initializers; not used here.

        Returns:
            ``shape[0]`` x ``shape[1]`` array of dtype ``np.float32``.
        """
        n_rows = shape[0]
        n_cols = shape[1]
        return np.eye(n_rows, n_cols, dtype=np.float32)

    @property
    def init_name(self):
        """Name of the concrete initializer class."""
        return type(self).__name__
class InitializeWeights:
    """
    Facade that selects a weight initializer by its string key and
    delegates weight generation to it.
    """

    # Registry mapping the public string key to the initializer class.
    _methods = {
        'ones': One,
        'zeros': Zero,
        'identity': Identity,
        'he_normal': HeNormal,
        'he_uniform': HeUniform,
        'lecun_normal': LeCunNormal,
        'lecun_uniform': LeCunUniform,
        'random_normal': RandomNormal,
        'glorot_normal': GlorotNormal,
        'random_uniform': RandomUniform,
        'glorot_uniform': GlorotUniform,
    }

    def __init__(self, name):
        """
        Instantiate the initializer registered under ``name``.

        Args:
            name: one of the keys of ``_methods``.

        Raises:
            Exception: if ``name`` is not a registered key; the message
                lists every accepted key.
        """
        initializer_cls = self._methods.get(name)
        if initializer_cls is None:
            known = ', '.join(self._methods)
            raise Exception('Weight initialization method must be either one of the following: {}.'.format(known))
        self.init_method = initializer_cls()

    @property
    def name(self):
        """Class name of the selected initializer (its ``init_name``)."""
        return self.init_method.init_name

    def initialize_weights(self, shape, random_seed=None):
        """
        Generate weights with the selected initializer.

        Args:
            shape: shape forwarded to the initializer's ``weights`` method.
            random_seed: seed forwarded to the initializer; defaults to
                ``None``.

        Returns:
            Whatever the selected initializer's ``weights`` method returns.
        """
        initializer = self.init_method
        return initializer.weights(shape, random_seed)