Completed
Pull Request — master (#941) by David
03:55 (queued 02:23)

blocks.graph.ComputationGraph (Rating: F)

Complexity

Total Complexity 65

Size/Duplication

Total Lines 282
Duplicated Lines 0 %
Metric  Value
dl      0
loc     282
rs      3.3333
wmc     65

14 Methods

Rating  Name                      Duplication  Size  Complexity
A       inputs()                  0            4     3
A       shared_variables()        0            3     3
B       replace()                 0            86    6
A       auxiliary_variables()     0            3     3
A       get_theano_function()     0            15    2
A       __init__()                0            6     2
A       __iter__()                0            2     1
A       scan_variables()          0            4     2
A       parameters()              0            4     3
A       intermediary_variables()  0            5     4
F       _get_variables()          0            49    21
B       has_inputs()              0            19    6
C       get_snapshot()            0            24    7
A       dict_of_inputs()          0            3     2

How to fix: Complexity

Complex Class

Complex classes like blocks.graph.ComputationGraph often do a lot of different things. To break such a class down, we need to identify a cohesive component within that class. A common approach to finding such a component is to look for fields and methods that share the same prefixes or suffixes.

Once you have determined which fields and methods belong together, you can apply the Extract Class refactoring. If the component makes sense as a subclass, Extract Subclass is also a candidate, and is often faster.
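
For illustration only (this sketch is not part of the pull request): in the listing below, the Scan-related members `scans`, `_scan_graphs`, and the `scan_variables` property share a common prefix and form exactly such a cohesive component. One possible Extract Class sketch, in Python:

# Illustrative sketch of an Extract Class refactoring; not code from this
# pull request. It groups the Scan-related members of ComputationGraph into
# a small helper that the class would delegate to.
from itertools import chain

from theano.scan_module.scan_op import Scan
from toolz import unique


class ScanCollection(object):
    """Holds the Scan ops of a graph and their inner sub-graphs."""

    def __init__(self, sorted_apply_nodes):
        self.scans = list(unique(node.op for node in sorted_apply_nodes
                                 if isinstance(node.op, Scan)))
        # ComputationGraph as defined in the listing below.
        self.graphs = [ComputationGraph(scan.outputs)
                       for scan in self.scans]

    @property
    def variables(self):
        """All variables of the inner graphs of the Scan ops."""
        return list(chain(*[g.variables for g in self.graphs]))

`_get_variables` would then build one `ScanCollection` from `sorted_apply_nodes`, and `scans`, `_scan_graphs`, and `scan_variables` would become thin delegations to it, trimming three members from `ComputationGraph` without changing behaviour.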

"""Annotated computation graph management."""
import logging
from collections import OrderedDict
from itertools import chain
import warnings

import numpy
import theano
from picklable_itertools.extras import equizip
from theano import Variable
from theano.gof import graph
from theano.sandbox.rng_mrg import MRG_RandomStreams
from theano.scan_module.scan_op import Scan
from toolz import unique

from ..config import config
from ..roles import (add_role, has_roles, AUXILIARY, PARAMETER, DROPOUT,
                     COLLECTED, COLLECTOR)
from ..utils import (is_graph_input, is_shared_variable, dict_union,
                     shared_floatx_zeros, shared_like)
from .annotations import add_annotation, Annotation  # noqa
from .bn import batch_normalization, apply_batch_normalization  # noqa

logger = logging.getLogger(__name__)


class ComputationGraph(object):
    r"""Encapsulates a managed Theano computation graph.

    This implies that it not only contains the variables required to
    compute the given outputs, but also all the auxiliary variables and
    updates that were attached to these variables through the annotation
    system.

    All variables are presented in topologically sorted order according to
    the apply nodes that they are an input to.

    Parameters
    ----------
    outputs : (list of) :class:`~tensor.TensorVariable`
        The output(s) of the computation graph.

    Attributes
    ----------
    inputs : list of :class:`~tensor.TensorVariable`
        The inputs of the computation graph. This does not include shared
        variables and constants.
    shared_variables : list of :class:`~tensor.TensorSharedVariable`
        All the shared variables in the graph.
    parameters : list of :class:`~tensor.TensorSharedVariable`
        All the shared variables which have the :const:`.PARAMETER` role.
    outputs : list of :class:`~tensor.TensorVariable`
        The outputs of the computation graph (as passed to the
        constructor).
    auxiliary_variables : list of :class:`~tensor.TensorVariable`
        All variables which have the :const:`.AUXILIARY` role.
    intermediary_variables : list of :class:`~tensor.TensorVariable`
        Any variable that is not part of :attr:`inputs` or :attr:`outputs`.
    variables : list of :class:`~tensor.TensorVariable`
        All variables (including auxiliary) in the managed graph.
    scans : list of :class:`~theano.scan_module.scan_op.Scan`
        All Scan ops used in this computation graph.
    scan_variables : list of :class:`~tensor.TensorVariable`
        All variables of the inner graphs of Scan ops.
    updates : :class:`~tensor.TensorSharedVariable` updates
        All the updates found attached to the annotations.

    """
    def __init__(self, outputs):
        if isinstance(outputs, Variable):
            outputs = [outputs]
        self.outputs = outputs
        self._get_variables()
        self._has_inputs = {}

    def __iter__(self):
        return iter(self.variables)

    @property
    def inputs(self):
        """Inputs to the graph, excluding constants and shared variables."""
        return [var for var in self.variables if is_graph_input(var)]

    @property
    def intermediary_variables(self):
        return [var for var in self.variables if
                var not in self.inputs and
                var not in self.outputs]

    @property
    def shared_variables(self):
        return [var for var in self.variables if is_shared_variable(var)]

    @property
    def parameters(self):
        return [var for var in self.shared_variables
                if has_roles(var, [PARAMETER])]

    @property
    def auxiliary_variables(self):
        return [var for var in self.variables if has_roles(var, [AUXILIARY])]

    @property
    def scan_variables(self):
        """Variables of Scan ops."""
        return list(chain(*[g.variables for g in self._scan_graphs]))

    def _get_variables(self):
        """Collect variables, updates and auxiliary variables.

        In addition collects all :class:`.Scan` ops and recurses into the
        respective inner Theano graphs.

        """
        updates = OrderedDict()

        shared_outputs = [o for o in self.outputs if is_shared_variable(o)]
        usual_outputs = [o for o in self.outputs if not is_shared_variable(o)]
        variables = shared_outputs

        if usual_outputs:
            # Sort apply nodes topologically, get variables and remove
            # duplicates
            inputs = graph.inputs(self.outputs)
            sorted_apply_nodes = graph.io_toposort(inputs, usual_outputs)
            self.scans = list(unique([node.op for node in sorted_apply_nodes
                                     if isinstance(node.op, Scan)]))
            self._scan_graphs = [ComputationGraph(scan.outputs)
                                 for scan in self.scans]

            seen = set()
            main_vars = (
                [var for var in list(chain(
                    *[apply_node.inputs for apply_node in sorted_apply_nodes]))
                 if not (var in seen or seen.add(var))] +
                [var for var in self.outputs if var not in seen])

            # While preserving order, add auxiliary variables and collect
            # updates
            seen = set()
            # Intermediate variables could be auxiliary
            seen_avs = set(main_vars)
            variables = []
            for var in main_vars:
                variables.append(var)
                for annotation in getattr(var.tag, 'annotations', []):
                    if annotation not in seen:
                        seen.add(annotation)
                        new_avs = [
                            av for av in annotation.auxiliary_variables
                            if not (av in seen_avs or seen_avs.add(av))]
                        variables.extend(new_avs)
                        updates = dict_union(updates, annotation.updates)

        self.variables = variables
        self.updates = updates

    def dict_of_inputs(self):
        """Return a mapping from an input name to the input."""
        return {var.name: var for var in self.inputs}

    def replace(self, replacements):
        """Replace certain variables in the computation graph.

        Parameters
        ----------
        replacements : dict
            The mapping from variables to be replaced to the corresponding
            substitutes.

        Examples
        --------
        >>> import theano
        >>> from theano import tensor, function
        >>> x = tensor.scalar('x')
        >>> y = x + 2
        >>> z = y + 3
        >>> a = z + 5

        Let's suppose we have dependent replacements like

        >>> replacements = {y: x * 2, z: y * 3}
        >>> cg = ComputationGraph([a])
        >>> theano.pprint(a)  # doctest: +NORMALIZE_WHITESPACE
        '(((x + TensorConstant{2}) + TensorConstant{3}) +
        TensorConstant{5})'
        >>> cg_new = cg.replace(replacements)
        >>> theano.pprint(
        ...     cg_new.outputs[0])  # doctest: +NORMALIZE_WHITESPACE
        '(((x * TensorConstant{2}) * TensorConstant{3}) +
        TensorConstant{5})'

        The first two sums were turned into multiplications

        >>> float(function(cg_new.inputs, cg_new.outputs)(3.)[0])
        23.0

        """
        # Due to Theano specifics we have to make one replacement at a time
        replacements = OrderedDict(replacements)

        outputs_cur = self.outputs

        # `replacements` with previous replacements applied. We have to track
        # variables in the new graph corresponding to original replacements.
        replacement_keys_cur = []
        replacement_vals_cur = []
        # Sort `replacements` in topological order
        # (variables in self.variables are in topological order)
        remaining_replacements = replacements.copy()
        for variable in self.variables:
            if variable in replacements:
                if has_roles(variable, [AUXILIARY]):
                    warnings.warn(
                        "replace method was asked to replace a variable ({}) "
                        "that is an auxiliary variable.".format(variable))
                replacement_keys_cur.append(variable)
                # self.variables should not contain duplicates,
                # otherwise pop() may fail.
                replacement_vals_cur.append(
                    remaining_replacements.pop(variable))

        # if remaining_replacements is not empty
        if remaining_replacements:
            warnings.warn(
                "replace method was asked to replace variable(s) ({}) "
                "that are not part of the computation "
                "graph.".format(str(remaining_replacements.keys())))

        # Replace step-by-step in topological order
        while replacement_keys_cur:
            replace_what = replacement_keys_cur[0]
            replace_by = replacement_vals_cur[0]
            # We also want to make changes in future replacements
            outputs_new = theano.clone(
                outputs_cur + replacement_keys_cur[1:] +
                replacement_vals_cur[1:],
                replace={replace_what: replace_by})
            # Reconstruct outputs, keys, and values
            outputs_cur = outputs_new[:len(outputs_cur)]
            replacement_keys_cur = outputs_new[len(outputs_cur):
                                               len(outputs_cur) +
                                               len(replacement_keys_cur) - 1]
            replacement_vals_cur = outputs_new[len(outputs_cur) +
                                               len(replacement_keys_cur):]

        return ComputationGraph(outputs_cur)

    def get_theano_function(self, additional_updates=None, **kwargs):
        r"""Create a Theano function from the contained graph.

        Parameters
        ----------
        \*\*kwargs : dict
            Keyword arguments to theano.function.
            Useful for specifying compilation modes or profiling.

        """
        updates = self.updates
        if additional_updates:
            updates = dict_union(updates, OrderedDict(additional_updates))
        return theano.function(self.inputs, self.outputs, updates=updates,
                               **kwargs)

    def get_snapshot(self, data):
        """Evaluate all role-carrying Theano variables on given data.

        Parameters
        ----------
        data : dict of (data source, data) pairs
            Data for input variables. The sources should match the
            names of the input variables.

        Returns
        -------
        Dictionary of (variable, variable value on given data) pairs.

        """
        role_variables = [var for var in self.variables
                          if hasattr(var.tag, "roles") and
                          not is_shared_variable(var)]
        value_holders = [shared_like(var) for var in role_variables]
        function = self.get_theano_function(equizip(value_holders,
                                                    role_variables))
        function(*(data[input_.name] for input_ in self.inputs))
        return OrderedDict([(var, value_holder.get_value(borrow=True))
                            for var, value_holder in equizip(role_variables,
                                                             value_holders)])

    def has_inputs(self, variable):
        """Check if a variable depends on input variables.

        Returns
        -------
        bool
            ``True`` if the given variable depends on input variables,
            ``False`` otherwise.

        """
        if variable not in self._has_inputs:
            self._has_inputs[variable] = False
            if is_graph_input(variable):
                self._has_inputs[variable] = True
            elif getattr(variable, 'owner', None):
                for dependency in variable.owner.inputs:
                    if self.has_inputs(dependency):
                        self._has_inputs[variable] = True
        return self._has_inputs[variable]


def apply_noise(computation_graph, variables, level, seed=None):
    """Add Gaussian noise to certain variables of a computation graph.

    Parameters
    ----------
    computation_graph : instance of :class:`ComputationGraph`
        The computation graph.
    variables : list of :class:`~tensor.TensorVariable`
        Variables to add noise to.
    level : float
        Noise level (standard deviation of the added Gaussian noise).
    seed : int, optional
        The seed with which
        :class:`~theano.sandbox.rng_mrg.MRG_RandomStreams` is initialized;
        set to 1 by default.

    """
    if not seed:
        seed = config.default_seed
    rng = MRG_RandomStreams(seed)
    replace = {}
    for variable in variables:
        replace[variable] = (variable +
                             rng.normal(variable.shape, std=level))
    return computation_graph.replace(replace)


def collect_parameters(computation_graph, parameters):
    """Replace parameters with a single shared variable.

    This can be useful if you need to calculate the full Hessian of a
    computational graph. It replaces parameters with slices of a single
    large vector like

    >>> from blocks.utils import shared_floatx
    >>> W1 = shared_floatx(numpy.random.rand(10, 10))
    >>> W2 = shared_floatx(numpy.random.rand(10, 10))
    >>> all_parameters = shared_floatx(numpy.concatenate(
    ...     [W1.get_value().flatten(), W2.get_value().flatten()]))
    >>> W1 = all_parameters[:W1.size]
    >>> W2 = all_parameters[W1.size:]

    Parameters
    ----------
    computation_graph : :class:`ComputationGraph` instance
        The managed Theano graph in which to collect parameters.
    parameters : list of Theano shared variables
        The parameters whose values should be collected.

    Returns
    -------
    ComputationGraph instance
        A new Theano graph which has all the given parameters collected
        into a single large shared variable.

    Notes
    -----
    Note that this replacement makes the training of the model
    significantly slower because of the large number of Theano's
    ``set_subtensor`` calls needed to train the model.

    Examples
    --------
    >>> from blocks.bricks import MLP, Logistic
    >>> from blocks.bricks.cost import SquaredError
    >>> from theano import tensor
    >>> x = tensor.matrix()
    >>> mlp = MLP(activations=[Logistic(), Logistic()],
    ...           dims=[784, 100, 784])
    >>> cost = SquaredError().apply(x, mlp.apply(x))
    >>> cg = ComputationGraph(cost)
    >>> new_cg = collect_parameters(cg, cg.shared_variables)

    The new graph only has a single shared variable. This variable receives
    the :const:`COLLECTOR` role.

    >>> new_cg.shared_variables
    [collected_parameters]

    The bricks' variables have been replaced with reshaped segments of this
    single shared variable. These replacements are given the
    :const:`.COLLECTED` role.

    >>> from blocks.filter import VariableFilter
    >>> from blocks.roles import PARAMETER
    >>> var_filter = VariableFilter(roles=[COLLECTED])
    >>> var_filter(new_cg.variables)  # doctest: +SKIP
    [Reshape{1}.0, Reshape{1}.0, Reshape{2}.0, Reshape{2}.0]

    """
    parameter_values, parameter_sizes, parameter_shapes = [], [], []
    for parameter in parameters:
        parameter_values.append(parameter.get_value(borrow=True))
        parameter_sizes.append(parameter_values[-1].size)
        parameter_shapes.append(parameter_values[-1].shape)

    new_parameters = shared_floatx_zeros(sum(parameter_sizes))
    new_parameters.set_value(numpy.concatenate([value.flatten()
                             for value in parameter_values]))
    new_parameters.name = 'collected_parameters'
    add_role(new_parameters, COLLECTOR)

    replacements = {}
    for parameter, shape, i, j in zip(parameters, parameter_shapes,
                                      numpy.cumsum([0] + parameter_sizes[:-1]),
                                      numpy.cumsum(parameter_sizes)):
        new_parameter = new_parameters[i:j].reshape(shape)
        new_parameter.replacement_of = parameter
        add_role(new_parameter, COLLECTED)
        replacements[parameter] = new_parameter
    return computation_graph.replace(replacements)


def apply_dropout(computation_graph, variables, drop_prob, rng=None,
                  seed=None, custom_divisor=None):
    """Apply dropout to specified variables in a graph.

    Parameters
    ----------
    computation_graph : instance of :class:`ComputationGraph`
        The computation graph.
    variables : list of :class:`~tensor.TensorVariable`
        Variables to be dropped out.
    drop_prob : float
        Probability of dropping out. If you want to apply dropout
        with different probabilities for different layers, call it
        several times.
    rng : :class:`~theano.sandbox.rng_mrg.MRG_RandomStreams`
        Random number generator.
    seed : int
        Random seed to be used if `rng` was not specified.
    custom_divisor : float or None, optional
        Divide dropped variables by a given scalar value. If `None`
        (default), dropped variables will be divided by `(1 - drop_prob)`,
        which is equivalent to scaling by `(1 - drop_prob)` at test
        time as recommended in [DROPOUT]_.

    Returns
    -------
    dropped_computation_graph : instance of :class:`ComputationGraph`
        A new computation graph with dropout applied to the specified
        variables. In order to train with, or monitor, the outputs
        of the original computation graph with dropout applied, use
        the variables contained in `dropped_computation_graph.outputs`.

    Notes
    -----
    For more information, see [DROPOUT]_.

    .. [DROPOUT] Hinton et al. *Improving neural networks by preventing
       co-adaptation of feature detectors*, arXiv:1207.0580.

    Examples
    --------
    >>> import numpy
    >>> from theano import tensor, function
    >>> from blocks.bricks import MLP, Identity
    >>> from blocks.filter import VariableFilter
    >>> from blocks.initialization import Constant
    >>> from blocks.roles import INPUT
    >>> linear = MLP([Identity(), Identity()], [2, 10, 2],
    ...              weights_init=Constant(1), biases_init=Constant(2))
    >>> x = tensor.matrix('x')
    >>> y = linear.apply(x)
    >>> cg = ComputationGraph(y)

    We are going to drop out all the input variables

    >>> inputs = VariableFilter(roles=[INPUT])(cg.variables)

    Here we apply dropout with the default settings to our computation graph

    >>> cg_dropout = apply_dropout(cg, inputs, 0.5)

    Dropped-out variables have the role `DROPOUT` and are tagged with a
    `replacement_of` tag. Let's filter these variables and check if they
    have links to the original ones.

    >>> dropped_out = VariableFilter(roles=[DROPOUT])(cg_dropout.variables)
    >>> inputs_referenced = [var.tag.replacement_of for var in dropped_out]
    >>> set(inputs) == set(inputs_referenced)
    True

    Compiling Theano functions to forward propagate in the original and
    dropped-out graphs

    >>> fprop = function(cg.inputs, cg.outputs[0])
    >>> fprop_dropout = function(cg_dropout.inputs, cg_dropout.outputs[0])

    Initialize the MLP and apply these functions

    >>> linear.initialize()
    >>> fprop(numpy.ones((3, 2),
    ...       dtype=theano.config.floatX))  # doctest:+ELLIPSIS
    array([[ 42.,  42.],
           [ 42.,  42.],
           [ 42.,  42.]]...
    >>> fprop_dropout(numpy.ones((3, 2),
    ...               dtype=theano.config.floatX))  # doctest:+ELLIPSIS
    array([[ 0.,  0.],
           [ 0.,  0.],
           [ 0.,  0.]]...

    And after a second run the answer is different

    >>> fprop_dropout(numpy.ones((3, 2),
    ...               dtype=theano.config.floatX))  # doctest:+ELLIPSIS
    array([[   0.,   52.],
           [ 100.,    0.],
           [   0.,    0.]]...

    """
    if not rng and not seed:
        seed = config.default_seed
    if not rng:
        rng = MRG_RandomStreams(seed)
    if custom_divisor is None:
        divisor = (1 - drop_prob)
    else:
        divisor = custom_divisor
    replacements = [(var, var *
                     rng.binomial(var.shape, p=1 - drop_prob,
                                  dtype=theano.config.floatX) /
                     divisor)
                    for var in variables]
    for variable, replacement in replacements:
        add_role(replacement, DROPOUT)
        replacement.tag.replacement_of = variable

    return computation_graph.replace(replacements)
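
Unlike `replace`, `collect_parameters`, and `apply_dropout`, the `apply_noise` docstring carries no usage example. A minimal sketch of how it is typically called (assuming a working Theano/Blocks installation; the names `W`, `x`, and `cost` are made up for the example):

import numpy
import theano
from theano import tensor

from blocks.graph import ComputationGraph, apply_noise
from blocks.utils import shared_floatx

# A toy graph with one shared parameter and one input.
W = shared_floatx(numpy.ones((2, 2)), name='W')
x = tensor.matrix('x')
cost = tensor.dot(x, W).sum()
cg = ComputationGraph(cost)

# Build a new graph in which W is replaced by W plus Gaussian noise with
# standard deviation 0.01; the original graph is left untouched.
noisy_cg = apply_noise(cg, [W], level=0.01, seed=1)
noisy_cost = theano.function(noisy_cg.inputs, noisy_cg.outputs)

The same pattern gives weight noise during training: pass the parameters of interest and use `noisy_cg.outputs` as the training cost.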