Completed
Pull Request — master (#941)
created by David, 01:46

blocks.graph.batch_normalize()   Rating: F

Complexity
  Conditions: 14

Size
  Total Lines: 102

Duplication
  Lines: 0
  Ratio: 0 %

Metric  Value
cc      14
dl      0
loc     102
rs      2

3 Methods

Rating  Name                                       Duplication  Size  Complexity
A       blocks.graph.prepare_replacement()         0            8     1
A       blocks.graph.get_application_call_dict()   0            3     2
A       blocks.graph.make_variable_filter()        0            3     1

How to fix

Long Method

Small methods make your code easier to understand, particularly when combined with a good name. Moreover, when a method is small, finding a good name is usually much easier.

For example, if you find yourself adding comments to a method's body, that is usually a sign that the commented part should be extracted into a new method, with the comment serving as a starting point for its name.

The most commonly applied refactoring here is Extract Method, as described above; a minimal sketch follows.
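As an illustration only (none of these names come from the code under review), a small Python sketch of the Extract Method idea:

import numpy

# Before: one method doing two things, with a comment marking the second step.
def batch_statistics(inputs, epsilon):
    mean = inputs.mean(axis=0)
    # stabilize the standard deviation with a small constant
    stdev = (inputs.var(axis=0) + epsilon) ** 0.5
    return mean, stdev

# After: the commented part is extracted, and the comment inspires the name.
def stabilized_stdev(inputs, epsilon):
    """Standard deviation stabilized by a small constant."""
    return (inputs.var(axis=0) + epsilon) ** 0.5

def batch_statistics(inputs, epsilon):
    return inputs.mean(axis=0), stabilized_stdev(inputs, epsilon)

mean, stdev = batch_statistics(numpy.random.rand(10, 4), 1e-4)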

Complexity

Complex code like blocks.graph.batch_normalize() often does a lot of different things. To break such a unit down, we need to identify a cohesive component within it. A common approach is to look for fields or methods that share the same prefix or suffix.

Once you have determined which fields belong together, you can apply the Extract Class refactoring. If the component makes sense as a subclass, Extract Subclass is also a candidate and is often faster; a minimal sketch of the prefix-grouping idea follows below.
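A hypothetical Python sketch of Extract Class, with class and attribute names invented purely for illustration:

# Before: one class mixing concerns; the minibatch_* attributes share a prefix.
class Normalizer:
    def __init__(self):
        self.minibatch_mean = None
        self.minibatch_std = None
        self.population_mean = None
        self.population_std = None

# After Extract Class: the prefixed members move into a cohesive component.
class MinibatchStatistics:
    def __init__(self, mean=None, std=None):
        self.mean = mean
        self.std = std

class Normalizer:
    def __init__(self):
        self.minibatch = MinibatchStatistics()
        self.population_mean = None
        self.population_std = None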

import collections
from theano import tensor

from . import add_annotation
from ..roles import (BATCH_NORM_OFFSET, BATCH_NORM_DIVISOR,
                     BATCH_NORM_POPULATION_STATISTICS,
                     BATCH_NORM_MINIBATCH_ESTIMATE, INPUT, add_role,
                     has_roles)


def batch_normalize(computation_graph, epsilon=1e-4):
    """Activate batch normalization in a graph.

    Parameters
    ----------
    computation_graph : instance of :class:`ComputationGraph`
        The computation graph containing :class:`BatchNormalization`
        brick applications.
    epsilon : float, optional
        The stabilizing constant for the minibatch standard deviation
        computation. Added to the variance inside the square root, as
        in the batch normalization paper.

    Returns
    -------
    batch_normed_computation_graph : instance of :class:`ComputationGraph`
        The computation graph, with :class:`BatchNormalization`
        applications transformed to use minibatch statistics instead
        of accumulated population statistics.
    population_to_minibatch : OrderedDict
        A mapping of variables used in the original graph for population
        means and standard deviations to the minibatch-derived quantities
        that replace them. Useful to define updates in order to track
        the approximate population statistics during learning.

    Notes
    -----
    Assumes the minibatch axis is 0. Other axes are unsupported at
    this time.

    """
    # Avoid a circular import.
    from ..filter import VariableFilter, get_application_call

    # Create filters for variables involved in a batch normalization brick
    # application.
    def make_variable_filter(role):
        from blocks.bricks import BatchNormalization
        return VariableFilter(bricks=[BatchNormalization], roles=[role])

    mean_filter, stdev_filter, input_filter = map(make_variable_filter,
                                                  [BATCH_NORM_OFFSET,
                                                   BATCH_NORM_DIVISOR, INPUT])

    # Group means, standard deviations, and inputs into dicts indexed by
    # application call.
    def get_application_call_dict(variable_filter):
        return collections.OrderedDict((get_application_call(v), v) for v in
                                       variable_filter(computation_graph))

    means, stdevs, inputs = map(get_application_call_dict,
                                [mean_filter, stdev_filter, input_filter])

    assert (set(means.keys()) == set(stdevs.keys()) and
            set(means.keys()) == set(inputs.keys()))
    assert set(means.values()).isdisjoint(stdevs.values())

    replacements = []
    # Perform replacement for each application call.
    for application_call in means:
        axes = tuple(i for i, b in enumerate(means[application_call]
                                             .broadcastable) if b)
        minibatch_mean = inputs[application_call].mean(axis=axes,
                                                       keepdims=True)
        minibatch_mean.name = 'minibatch_offset'
        # Stabilize in the same way as the batch normalization manuscript.
        minibatch_std = tensor.sqrt(tensor.var(inputs[application_call],
                                               axis=axes, keepdims=True) +
                                    epsilon)
        minibatch_std.name = 'minibatch_divisor'

        def prepare_replacement(old, new, role, application_call):
            """Add roles and tags to replaced variables."""
            add_role(new, BATCH_NORM_MINIBATCH_ESTIMATE)
            add_role(new, role)
            add_annotation(new, application_call)
            add_annotation(new, application_call.application.brick)
            new.tag.replacement_of = old
            replacements.append((old, new))

        prepare_replacement(means[application_call], minibatch_mean,
                            BATCH_NORM_OFFSET, application_call)
        prepare_replacement(stdevs[application_call], minibatch_std,
                            BATCH_NORM_DIVISOR, application_call)

    new_graph = computation_graph.replace(replacements)

    population_to_minibatch = collections.OrderedDict()
    for original_graph_node, replacement in replacements:
        pop_stats = original_graph_node
        while not has_roles(pop_stats, [BATCH_NORM_POPULATION_STATISTICS]):
            pop_stats = pop_stats.owner.inputs[0]
        # Above, we are replacing a node that has a batch axis added to it
        # with a replacement formed via a reduction with keepdims=True. In
        # order for the actual shared variable and the replacement to have
        # compatible dimensions, we need to drop the leading axis of the
        # replacement.
        replacement = replacement[0]
        assert pop_stats.dtype == replacement.dtype
        assert pop_stats.broadcastable == replacement.broadcastable
        population_to_minibatch[pop_stats] = replacement
    return new_graph, population_to_minibatch
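To show how the two return values fit together, here is a minimal usage sketch. It assumes batch_normalize is importable from blocks.graph as proposed in this pull request, and that cost is an existing Theano scalar whose graph contains BatchNormalization brick applications; the moving-average update is only one possible way to use population_to_minibatch, following the docstring's note about tracking approximate population statistics.

from blocks.graph import ComputationGraph, batch_normalize  # assumes this PR's API

# `cost` is a placeholder here: any Theano scalar built through
# BatchNormalization brick applications (model construction not shown).
cg = ComputationGraph([cost])
bn_cg, population_to_minibatch = batch_normalize(cg, epsilon=1e-4)

# Train against the transformed graph's output...
bn_cost = bn_cg.outputs[0]

# ...and keep the population statistics roughly in sync with extra updates,
# e.g. an exponential moving average (the decay value is illustrative only).
decay = 0.95
extra_updates = [(pop, decay * pop + (1 - decay) * minibatch)
                 for pop, minibatch in population_to_minibatch.items()]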