Added Dead ReLU detector callback (#115)

2026-06-27 16:10:11 +08:00 · 2017-07-01 04:08:39 +03:00
parent 8ec9c77382
commit 13ec4b4174
3 changed files with 102 additions and 0 deletions
@@ -1 +1,2 @@
 from .snapshot import SnapshotCallbackBuilder, SnapshotModelCheckpoint
 from .dead_relu_detector import DeadReluDetector
@@ -0,0 +1,60 @@
 import numpy as np
 import warnings
 from keras.callbacks import Callback
 from keras.layers import Dense
 from keras import backend as K
 class DeadReluDetector(Callback):
    """Reports the number of dead ReLUs after each training epoch.

    A ReLU is considered dead if it did not fire once for the entire
    training set, i.e. its activation is zero for every sample in `x_train`.

    # Arguments
        x_train: Training dataset to check whether or not neurons fire
            (a list of arrays when the model has several inputs)
        verbose: verbosity mode
            True means that even a single dead neuron triggers warning
            False means that only significant number of dead neurons
            (more than 10%) triggers warning
    """
    def __init__(self, x_train, verbose=False):
        super(DeadReluDetector, self).__init__()
        self.x_train = x_train
        self.verbose = verbose
        # Share of dead neurons in a layer above which a warning is issued
        # even when `verbose` is False.
        self.dead_neurons_share_threshold = 0.1

    @staticmethod
    def is_relu_layer(layer):
        """Return True if `layer` is a Dense layer configured with 'relu' activation."""
        return isinstance(layer, Dense) and layer.get_config()['activation'] == 'relu'

    def get_relu_activations(self):
        """Yield `[layer_index, activations]` for every ReLU Dense layer.

        `activations` is the output of the layer evaluated on `self.x_train`;
        `layer_index` is the position of the layer in `self.model.layers`.
        """
        model_input = self.model.input
        is_multi_input = isinstance(model_input, list)
        if not is_multi_input:
            model_input = [model_input]

        if is_multi_input:
            list_inputs = list(self.x_train)
        else:
            list_inputs = [self.x_train]
        # Value fed for K.learning_phase(), the last placeholder of each function.
        list_inputs.append(1.)

        for layer_index, layer in enumerate(self.model.layers):
            # Only ReLU layers are reported, so do not build and evaluate
            # backend functions for any other layer.
            if not self.is_relu_layer(layer):
                continue
            func = K.function(model_input + [K.learning_phase()], [layer.output])
            yield [layer_index, func(list_inputs)[0]]

    def on_epoch_end(self, epoch, logs=None):
        """Warn about ReLU layers whose neurons never fired on `x_train`.

        # Arguments
            epoch: index of the epoch that has just finished (unused)
            logs: metrics dictionary passed by the training loop (unused)
        """
        for layer_index, activation_values in self.get_relu_activations():
            total_neurons = activation_values.shape[-1]
            # Collapse every leading axis so that each row is one observation
            # of the layer and each column is one neuron.
            per_neuron = activation_values.reshape(-1, total_neurons)
            # A neuron is alive if it produced a non-zero output at least once;
            # counting zero entries instead would count (sample, neuron) pairs.
            fired = np.any(per_neuron != 0, axis=0)
            dead_neurons = total_neurons - int(np.sum(fired))
            # float() keeps this a true division on Python 2 as well.
            dead_neurons_share = float(dead_neurons) / total_neurons
            if (self.verbose and dead_neurons > 0) or dead_neurons_share > self.dead_neurons_share_threshold:
                warnings.warn(
                    'Layer #{} has {} dead neurons ({:.2%})!'
                        .format(layer_index, dead_neurons, dead_neurons_share),
                    RuntimeWarning
                )
@@ -0,0 +1,41 @@
 import pytest
 import warnings
 import numpy as np
 from keras_contrib import callbacks
 from keras.models import Sequential
 from keras.layers import Dense
 def test_DeadDeadReluDetector():
    """Check that DeadReluDetector warns according to its verbosity setting.

    A single Dense ReLU layer without bias is fed an all-ones input, so a
    neuron whose incoming weight is zero outputs zero.
    """
    def do_test(weights, expected_warnings, verbose):
        """Train for one epoch with the detector attached and count its warnings."""
        with warnings.catch_warnings(record=True) as w:
            # Record every warning, independent of the filters that happen to
            # be active in the surrounding process.
            warnings.simplefilter('always')
            dataset = np.ones((1, 1, 1))    # data to be fed as training
            model = Sequential()
            model.add(Dense(10, activation='relu', input_shape=(1, 1), use_bias=False, weights=[weights]))
            model.compile(optimizer='sgd', loss='categorical_crossentropy')
            model.fit(
                dataset,
                np.ones((1, 1, 10)),
                epochs=1,
                callbacks=[callbacks.DeadReluDetector(dataset, verbose=verbose)],
                verbose=False
            )
        # Unrelated warnings of other categories (e.g. deprecations raised by
        # the backend) must not influence the count.
        runtime_warnings = [item for item in w if issubclass(item.category, RuntimeWarning)]
        assert len(runtime_warnings) == expected_warnings
        for warn_item in runtime_warnings:
            assert "dead neurons" in str(warn_item.message)

    weights_1_dead = np.ones((1, 10))      # weights that correspond to NN with 1/10 neurons dead
    weights_1_dead[:, 0] = 0
    weights_2_dead = np.ones((1, 10))      # weights that correspond to NN with 2/10 neurons dead
    weights_2_dead[:, 0] = 0
    weights_2_dead[:, 1] = 0

    do_test(weights_1_dead, verbose=True, expected_warnings=1)
    do_test(weights_1_dead, verbose=False, expected_warnings=0)
    do_test(weights_2_dead, verbose=True, expected_warnings=1)
 # Run this module's tests through pytest when it is executed as a script.
 if __name__ == '__main__':
    pytest.main([__file__])
`@@ -1 +1,2 @@`
	`from .snapshot import SnapshotCallbackBuilder, SnapshotModelCheckpoint`	`from .snapshot import SnapshotCallbackBuilder, SnapshotModelCheckpoint`
		`from .dead_relu_detector import DeadReluDetector`