tensorflow/python/ops/control_flow_util_v2.py - platform/external/tensorflow - Git at Google

 # Copyright 2018 The TensorFlow Authors. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 # ==============================================================================

 """Utilties for V2 control flow."""

 from __future__ import absolute_import
 from __future__ import division
 from __future__ import print_function

 from tensorflow.core.framework import attr_value_pb2
 from tensorflow.python.distribute import distribution_strategy_context
 from tensorflow.python.eager import context
 from tensorflow.python.eager import function
 from tensorflow.python.framework import ops
 from tensorflow.python.framework.func_graph import FuncGraph
 from tensorflow.python.keras.engine import base_layer_utils
 from tensorflow.python.ops import control_flow_util
 from tensorflow.python.ops import control_flow_v2_func_graphs
 from tensorflow.python.util import tf_contextlib

 # Override consulted first by `output_all_intermediates()`: when this is not
 # None, that function returns it as-is and skips every other check.
 _EXPERIMENTAL_OUTPUT_ALL_INTERMEDIATES_OVERRIDE = None

 # Module-local aliases for the graph classes defined in
 # `control_flow_v2_func_graphs`.
 CondBranchFuncGraph = control_flow_v2_func_graphs.CondBranchFuncGraph
 WhileCondFuncGraph = control_flow_v2_func_graphs.WhileCondFuncGraph
 WhileBodyFuncGraph = control_flow_v2_func_graphs.WhileBodyFuncGraph


 def in_defun():
   """Returns if the current graph is, or is nested in, a defun.

   Control flow graphs (cond branches, while bodies and while conds) are
   skipped by following `outer_graph` until a graph of another kind is
   reached. The result says whether that graph is a `FuncGraph`.

   Returns:
     False when executing eagerly. Otherwise, True iff the first enclosing
     graph that is not a cond/while graph is a `FuncGraph`.
   """
   if context.executing_eagerly():
     return False

   graph = ops.get_default_graph()
   # A while-cond graph has to be unwrapped just like a while-body graph.
   # Otherwise control flow built inside a loop condition would be reported as
   # being inside a defun only because of the loop itself (presumably
   # WhileCondFuncGraph is a FuncGraph subclass like the other two).
   while isinstance(graph, (CondBranchFuncGraph, WhileBodyFuncGraph,
                            WhileCondFuncGraph)):
     graph = graph.outer_graph
   return isinstance(graph, FuncGraph)


 def create_new_tf_function(func_graph):
   """Turns `func_graph` into a TF_Function registered in its outer graph.

   Args:
     func_graph: The FuncGraph to convert. Its name, inputs and outputs are
       used to build the function, which is added to `func_graph.outer_graph`.

   Returns:
     The name of the new TF_Function (`func_graph.name`).
   """
   # pylint: disable=protected-access
   eager_fn = function._EagerDefinedFunction(
       func_graph.name,
       func_graph,
       func_graph.inputs,
       func_graph.outputs,
       {})
   # pylint: enable=protected-access
   eager_fn.add_to_graph(func_graph.outer_graph)
   return func_graph.name


 def unique_fn_name(scope, name):
   """Builds a unique name for a control flow function.

   The name is `scope`, `name` and a fresh `ops.uid()` joined together, with
   every "/" replaced by "_".

   Args:
     scope: A name scope string.
     name: An identifier for this function (e.g. "true", "body").

   Returns:
     A string, the name to use for the function.
   """
   raw_name = "%s%s_%s" % (scope, name, ops.uid())
   return raw_name.replace("/", "_")


 def unique_grad_fn_name(forward_name):
   """Builds a unique name for the gradient function of `forward_name`.

   Args:
     forward_name: The name of the forward function.

   Returns:
     A string of the form "<forward_name>_grad_<uid>", where the uid comes
     from `ops.uid()`.
   """
   uid = ops.uid()
   return "%s_grad_%s" % (forward_name, uid)


 def maybe_set_lowering_attr(op):
   """Marks `op` for lowering to switch/merge unless lowering must be avoided.

   Lowering lets cond_v2 and while_v2 sidestep some limitations of Functions:
   users can specify devices & colocation inside the branch/body functions,
   and non-strict evaluation & partial pruning become possible. This brings v2
   control flow closer to feature parity with v1 control flow.

   The attribute is NOT set in these cases:
     - The `If` or `While` op is in an XLA context, because XLA can apply its
       own optimizations more easily to un-lowered control flow operators
       than to low-level control flow primitives.
     - The eager context's function call options select the single threaded
       executor, because that executor does not support v1 control flow ops.

   Args:
     op: An `If` or `While` Operation.
   """
   if control_flow_util.GraphOrParentsInXlaContext(op.graph):
     return
   executor_type = context.context().function_call_options.executor_type
   if executor_type == "SINGLE_THREADED_EXECUTOR":
     return
   lower_attr = attr_value_pb2.AttrValue(b=True)
   # pylint: disable=protected-access
   op._set_attr("_lower_using_switch_merge", lower_attr)
   # pylint: enable=protected-access


 def maybe_propagate_compile_time_consts_in_xla(op):
   """Asks XLA to propagate compile-time consts into the loop body.

   Ops inside the loop body may need compile time constants, for example
   `max_num_elements` in `EmptyTensorList`. Ideally this would always be
   enabled, but that doesn't work with legacy functionalized while_loops, so
   the attribute is only set when `op.graph` or one of its parents is in an
   XLA context.

   Args:
     op: A `While` Operation.
   """
   if not control_flow_util.GraphOrParentsInXlaContext(op.graph):
     return
   propagate_attr = attr_value_pb2.AttrValue(b=True)
   # pylint: disable=protected-access
   op._set_attr("_xla_propagate_compile_time_consts", propagate_attr)
   # pylint: enable=protected-access


 def resource_input_index(tensor_name, input_names, node_defs, functions):
   """Resolves a resource tensor to the index of the function input feeding it.

   Starting from `tensor_name`, the producing op is looked up and the tensor
   is replaced by the op input that forwards the same resource, until a name
   listed in `input_names` is reached. Resource handles are assumed to never
   be created inside functions, so every resource tensor should lead back to
   a function input (the function could be a loop body).

   Names, NodeDefs and a function dict are taken instead of graph objects so
   that the routine works for both FuncGraphs and FunctionDefs and can recurse
   into function call ops without building the corresponding FuncGraph. (Even
   if a FuncGraph for a FunctionDef exists, input/output/node names may have
   changed during serialization, which makes it unusable here.)

   Args:
     tensor_name: the name of the resource tensor to be resolved to an input.
     input_names: a list of the names of all inputs to the function.
     node_defs: a dict mapping op name -> NodeDef for every op in the function.
     functions: a dict mapping function name -> _EagerDefinedFunction.

   Returns:
     The index into input_names corresponding to `tensor_name`.

   Raises:
     ValueError: if the walk reaches an op that is neither a `While` nor a
       `PartitionedCall`/`StatefulPartitionedCall`; such an op is taken to
       have created the resource handle.
   """
   current = tensor_name
   while current not in input_names:
     # FunctionDefs and graphs name tensors differently. Accepted spellings
     # are "op:x:idx" (middle field ignored), "op:idx" and a bare "op", which
     # means output 0.
     pieces = current.split(":")
     if len(pieces) == 3:
       producer, _, raw_idx = pieces
     elif len(pieces) == 2:
       producer, raw_idx = pieces
     else:
       assert len(pieces) == 1
       producer, raw_idx = pieces[0], 0
     out_idx = int(raw_idx)
     producer_def = node_defs[producer]
     op_type = producer_def.op

     if op_type == "While":
       # A while op carries a captured resource at the same position in its
       # inputs and its outputs, so the output index is also the input index.
       current = producer_def.input[out_idx]
       continue

     if op_type not in ("PartitionedCall", "StatefulPartitionedCall"):
       # No other op type is assumed to "forward" resource handles, so any
       # other producer must have created the handle itself. (cond_v2 wraps
       # resource handle outputs in optionals, which get accumulated.)
       raise ValueError("Taking gradient of a while loop which creates "
                        "a resource in its body is not supported: %s" % producer)

     # Function calls output the captured resource tensors used by their
     # gradients. Map this output to the callee's return tensor, resolve that
     # recursively inside the callee's FunctionDef, then continue from the
     # matching input of the call op.
     callee = functions[producer_def.attr["f"].func.name].definition
     ret_arg = callee.signature.output_arg[out_idx].name
     ret_tensor = callee.ret[ret_arg]
     callee_inputs = [arg.name for arg in callee.signature.input_arg]
     callee_nodes = {ndef.name: ndef for ndef in callee.node_def}
     callee_input_idx = resource_input_index(
         ret_tensor, callee_inputs, callee_nodes, functions)
     current = producer_def.input[callee_input_idx]

   return input_names.index(current)


 @tf_contextlib.contextmanager
 def clear_control_inputs():
   """Clears control inputs while keeping the current ControlFlowContext.

   Used when clearing control inputs for the gradient accumulators in
   while_v2, where the XLA control flow context has to survive.
   `ops.control_dependencies` on its own does not allow that, so the context
   is captured beforehand and set again inside the cleared scope.

   Yields:
     A context manager in which the ops created will not have any control
     inputs by default but the control flow context is the same.
   """
   # pylint: disable=protected-access
   saved_context = ops.get_default_graph()._get_control_flow_context()
   with ops.control_dependencies(None):
     # Reinstate the control flow context captured before entering the scope.
     default_graph = ops.get_default_graph()
     default_graph._set_control_flow_context(saved_context)
     yield
   # pylint: enable=protected-access


 def _is_tpu_strategy(strategy):
   return (strategy is not None and
           strategy.__class__.__name__.startswith("TPUStrategy"))


 def _is_building_keras_layer():
   """Returns whether the Keras call context currently has a layer set."""
   current_layer = base_layer_utils.call_context().layer
   return current_layer is not None


 def output_all_intermediates():
   """Decides whether a functional control flow op outputs all intermediates.

   A non-None `_EXPERIMENTAL_OUTPUT_ALL_INTERMEDIATES_OVERRIDE` is returned
   directly. Otherwise intermediates are output only while building a Keras
   Layer in graph mode, and only if none of the following holds:
   1. The op is being built inside a FuncGraph which is not an If/While graph.
      This guards against outputting intermediates in eager mode, since keras
      adds tensors to a FuncGraph named "keras_graph" in that case. Also,
      intermediates of tf.function are not output (this feature exists only
      for backwards compatibility), so outputting intermediates of functional
      control flow ops built inside tf.function is of no value.
   2. The compilation is using XLA or targets a TPU.
   3. A single threaded executor is used, since that does not perform inlining
      and pruning.

   Returns:
     A bool telling whether to output all intermediates.
   """
   override = _EXPERIMENTAL_OUTPUT_ALL_INTERMEDIATES_OVERRIDE
   if override is not None:
     return override

   # Condition 1: built inside a defun.
   if in_defun():
     return False

   # Condition 2: XLA context or TPU strategy.
   if control_flow_util.GraphOrParentsInXlaContext(ops.get_default_graph()):
     return False
   if _is_tpu_strategy(distribution_strategy_context.get_strategy()):
     return False

   # Condition 3: single threaded executor.
   executor_type = context.context().function_call_options.executor_type
   if executor_type == "SINGLE_THREADED_EXECUTOR":
     return False

   return _is_building_keras_layer()
	# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.
	# ==============================================================================

	"""Utilties for V2 control flow."""

	from __future__ import absolute_import
	from __future__ import division
	from __future__ import print_function

	from tensorflow.core.framework import attr_value_pb2
	from tensorflow.python.distribute import distribution_strategy_context
	from tensorflow.python.eager import context
	from tensorflow.python.eager import function
	from tensorflow.python.framework import ops
	from tensorflow.python.framework.func_graph import FuncGraph
	from tensorflow.python.keras.engine import base_layer_utils
	from tensorflow.python.ops import control_flow_util
	from tensorflow.python.ops import control_flow_v2_func_graphs
	from tensorflow.python.util import tf_contextlib

	# Override consulted first by `output_all_intermediates()`: when this is not
	# None, that function returns it as-is and skips every other check.
	_EXPERIMENTAL_OUTPUT_ALL_INTERMEDIATES_OVERRIDE = None

	# Module-local aliases for the graph classes defined in
	# `control_flow_v2_func_graphs`.
	CondBranchFuncGraph = control_flow_v2_func_graphs.CondBranchFuncGraph
	WhileCondFuncGraph = control_flow_v2_func_graphs.WhileCondFuncGraph
	WhileBodyFuncGraph = control_flow_v2_func_graphs.WhileBodyFuncGraph


	def in_defun():
	  """Returns if the current graph is, or is nested in, a defun.

	  Control flow graphs (cond branches, while bodies and while conds) are
	  skipped by following `outer_graph` until a graph of another kind is
	  reached. The result says whether that graph is a `FuncGraph`.

	  Returns:
	    False when executing eagerly. Otherwise, True iff the first enclosing
	    graph that is not a cond/while graph is a `FuncGraph`.
	  """
	  if context.executing_eagerly():
	    return False

	  graph = ops.get_default_graph()
	  # A while-cond graph has to be unwrapped just like a while-body graph.
	  # Otherwise control flow built inside a loop condition would be reported
	  # as being inside a defun only because of the loop itself (presumably
	  # WhileCondFuncGraph is a FuncGraph subclass like the other two).
	  while isinstance(graph, (CondBranchFuncGraph, WhileBodyFuncGraph,
	                           WhileCondFuncGraph)):
	    graph = graph.outer_graph
	  return isinstance(graph, FuncGraph)


	def create_new_tf_function(func_graph):
	  """Turns `func_graph` into a TF_Function registered in its outer graph.

	  Args:
	    func_graph: The FuncGraph to convert. Its name, inputs and outputs are
	      used to build the function, which is added to
	      `func_graph.outer_graph`.

	  Returns:
	    The name of the new TF_Function (`func_graph.name`).
	  """
	  func = function._EagerDefinedFunction(  # pylint: disable=protected-access
	      func_graph.name, func_graph, func_graph.inputs, func_graph.outputs, {})
	  func.add_to_graph(func_graph.outer_graph)
	  return func_graph.name


	def unique_fn_name(scope, name):
	  """Builds a unique name for a control flow function.

	  The name is `scope`, `name` and a fresh `ops.uid()` joined together, with
	  every "/" replaced by "_".

	  Args:
	    scope: A name scope string.
	    name: An identifier for this function (e.g. "true", "body").

	  Returns:
	    A string, the name to use for the function.
	  """
	  return ("%s%s_%s" % (scope, name, ops.uid())).replace("/", "_")


	def unique_grad_fn_name(forward_name):
	  """Builds a unique name for the gradient function of `forward_name`.

	  Args:
	    forward_name: The name of the forward function.

	  Returns:
	    A string of the form "<forward_name>_grad_<uid>", where the uid comes
	    from `ops.uid()`.
	  """
	  return "%s_grad_%s" % (forward_name, ops.uid())


	def maybe_set_lowering_attr(op):
	  """Sets the flag to enable lowering on `op` if necessary.

	  Lowering allows cond_v2 and while_v2 to avoid some of the limitations of
	  Functions, allowing users to specify devices & colocation inside of
	  cond_v2 and while_v2 input functions, and enabling non-strict evaluation &
	  partial pruning. This brings v2 control flow closer to feature parity with
	  v1 control flow.

	  However, we do not lower in the following cases:
	    - When the `If` or `While` ops are in the XLA context, because it is
	      easier for XLA to apply its own optimizations when dealing with
	      un-lowered control flow operators than with low-level control flow
	      primitives.
	    - When the eager context's function call options select the single
	      threaded executor, because that executor does not support v1 control
	      flow ops.

	  Args:
	    op: An `If` or `While` Operation.
	  """
	  if (not control_flow_util.GraphOrParentsInXlaContext(op.graph) and
	      context.context().function_call_options.executor_type !=
	      "SINGLE_THREADED_EXECUTOR"):
	    # pylint: disable=protected-access
	    op._set_attr("_lower_using_switch_merge",
	                 attr_value_pb2.AttrValue(b=True))
	    # pylint: enable=protected-access


	def maybe_propagate_compile_time_consts_in_xla(op):
	  """Tells XLA whether to propagate compile-time consts in the loop body.

	  This is needed to make compile time constants available to ops, for
	  example `max_num_elements` in `EmptyTensorList`, inside the loop body.
	  Ideally this would always be turned on, but that doesn't work with legacy
	  functionalized while_loops, so the attribute is only set when `op.graph`
	  or one of its parents is in an XLA context.

	  Args:
	    op: A `While` Operation.
	  """
	  if control_flow_util.GraphOrParentsInXlaContext(op.graph):
	    # pylint: disable=protected-access
	    op._set_attr("_xla_propagate_compile_time_consts",
	                 attr_value_pb2.AttrValue(b=True))
	    # pylint: enable=protected-access


	def resource_input_index(tensor_name, input_names, node_defs, functions):
	  """Returns the index of the input corresponding to `tensor_name`.

	  This method is used to find the corresponding index of an arbitrary
	  resource tensor in a function (the function could be a loop body). We
	  assume that resource handles are never created in functions, so that
	  every resource tensor can be traced back to a function input.

	  The awkward signature of this method is to make it work with both
	  FuncGraphs and FunctionDefs. This is so we can recurse on function call
	  ops without building the corresponding FuncGraph (note that even if a
	  FuncGraph for a FunctionDef already exists, the input/output/node names
	  may have been changed when the FuncGraph was serialized to the
	  FunctionDef, which makes it unusable with this algorithm).

	  Args:
	    tensor_name: the name of the resource tensor to be resolved to an input.
	    input_names: a list of the names of all inputs to the function.
	    node_defs: a dict mapping op name -> NodeDef for every op in the
	      function.
	    functions: a dict mapping function name -> _EagerDefinedFunction.

	  Returns:
	    The index into input_names corresponding to `tensor_name`.

	  Raises:
	    ValueError: if the walk reaches an op that is neither a `While` nor a
	      `PartitionedCall`/`StatefulPartitionedCall`; such an op is taken to
	      have created the resource handle.
	  """
	  while tensor_name not in input_names:
	    # FunctionDefs and graphs use different tensor naming conventions.
	    # Accepted spellings are "op:x:idx" (middle field ignored), "op:idx"
	    # and a bare "op", which means output 0.
	    parts = tensor_name.split(":")
	    if len(parts) == 3:
	      op_name, _, output_idx = parts
	    elif len(parts) == 2:
	      op_name, output_idx = parts
	    else:
	      assert len(parts) == 1
	      op_name = parts[0]
	      output_idx = 0
	    output_idx = int(output_idx)
	    node_def = node_defs[op_name]

	    if node_def.op == "While":
	      # Captured resources occur at the same index in the lists of inputs
	      # and outputs of a while op, so the output index is reused to look up
	      # the forwarding input.
	      tensor_name = node_def.input[output_idx]
	    elif node_def.op in ("PartitionedCall", "StatefulPartitionedCall"):
	      # Functions output any captured resource tensors used by their
	      # gradients. `tensor_name` is one of these outputs from a nested
	      # function call, so recursively find the corresponding input in the
	      # nested FunctionDef.
	      func_name = node_def.attr["f"].func.name
	      fdef = functions[func_name].definition
	      output_arg_name = fdef.signature.output_arg[output_idx].name
	      output_tensor_name = fdef.ret[output_arg_name]
	      input_index = resource_input_index(
	          output_tensor_name,
	          [arg.name for arg in fdef.signature.input_arg],
	          {ndef.name: ndef for ndef in fdef.node_def}, functions)
	      tensor_name = node_def.input[input_index]
	    else:
	      # We assume there are no other op types that will "forward" resource
	      # handles like this, so all other handles must have been created by
	      # the op. (Note that cond_v2 wraps resource handle outputs in
	      # optionals, which we'll end up accumulating).
	      raise ValueError("Taking gradient of a while loop which creates "
	                       "a resource in its body is not supported: %s" % op_name)

	  return input_names.index(tensor_name)


	@tf_contextlib.contextmanager
	def clear_control_inputs():
	  """Clears the control inputs but preserves the ControlFlowContext.

	  This is needed to preserve the XLA control flow context when clearing
	  control inputs for the gradient accumulators in while_v2.
	  `ops.control_dependencies` does not allow that, so the context is captured
	  beforehand and set again inside the cleared scope.

	  Yields:
	    A context manager in which the ops created will not have any control
	    inputs by default but the control flow context is the same.
	  """
	  # pylint: disable=protected-access
	  control_flow_context = ops.get_default_graph()._get_control_flow_context()
	  with ops.control_dependencies(None):
	    # Reinstate the control flow context captured before entering the scope.
	    ops.get_default_graph()._set_control_flow_context(control_flow_context)
	    yield
	  # pylint: enable=protected-access


	def _is_tpu_strategy(strategy):
	return (strategy is not None and
	strategy.__class__.__name__.startswith("TPUStrategy"))


	def _is_building_keras_layer():
	  """Returns whether the Keras call context currently has a layer set."""
	  return base_layer_utils.call_context().layer is not None


	def output_all_intermediates():
	  """Whether to output all intermediates of a functional control flow op.

	  A non-None `_EXPERIMENTAL_OUTPUT_ALL_INTERMEDIATES_OVERRIDE` is returned
	  directly. Otherwise the default behavior is to output intermediates only
	  when building a Keras Layer in graph mode, and only when certain other
	  conditions are met:
	  1. We do not output intermediates if the functional control flow op is
	     being built inside a FuncGraph which is not an If/While graph. This
	     guards against outputting intermediates in eager mode since keras adds
	     tensors to a FuncGraph named "keras_graph" in that case. Also, because
	     we do not output intermediates of tf.function (this feature is only
	     for backwards compatibility), outputting intermediates of functional
	     control flow ops built inside tf.function is of no value.
	  2. We do not output intermediates when the compilation is using XLA or
	     for a TPU.
	  3. We do not output intermediates when a single threaded executor is used
	     since that does not perform inlining and pruning.

	  Returns:
	    A bool telling whether to output all intermediates.
	  """
	  if _EXPERIMENTAL_OUTPUT_ALL_INTERMEDIATES_OVERRIDE is not None:
	    return _EXPERIMENTAL_OUTPUT_ALL_INTERMEDIATES_OVERRIDE
	  if in_defun():
	    return False
	  if (control_flow_util.GraphOrParentsInXlaContext(ops.get_default_graph())
	      or _is_tpu_strategy(distribution_strategy_context.get_strategy())):
	    return False
	  if (context.context().function_call_options.executor_type ==
	      "SINGLE_THREADED_EXECUTOR"):
	    return False
	  return _is_building_keras_layer()