blob: aee3a603d2be0f318be2da145acb3ddfc10e3821 [file] [log] [blame]
# Copyright 2017 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""SinhArcsinh bijector."""
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
import numpy as np
from tensorflow.python.framework import ops
from tensorflow.python.ops import array_ops
from tensorflow.python.ops import check_ops
from tensorflow.python.ops import control_flow_ops
from tensorflow.python.ops import math_ops
from tensorflow.python.ops.distributions import bijector
from tensorflow.python.util import deprecation
__all__ = [
"SinhArcsinh",
]
@deprecation.deprecated(
    "2018-10-01",
    "The TensorFlow Distributions library has moved to "
    "TensorFlow Probability "
    "(https://github.com/tensorflow/probability). You "
    "should update all references to use `tfp.distributions` "
    "instead of `tf.contrib.distributions`.",
    warn_once=True)
def _sqrtx2p1(x):
  """Numerically stable `sqrt(1 + x**2)` that is robust to very large `|x|`."""
  eps = np.finfo(x.dtype.as_numpy_dtype).eps
  # The naive formula is accurate whenever x**2 cannot overflow, i.e. when
  # |x| <= 1 / sqrt(machine epsilon).
  naive_is_safe = math_ops.abs(x) * np.sqrt(eps) <= 1.
  naive_result = math_ops.sqrt(x**2. + 1.)
  # For larger |x|, squaring can overflow.  Rewrite:
  #   sqrt(1 + x**2)
  #   = exp(0.5 log(1 + x**2))
  #   = exp(0.5 log(x**2 * (1 + x**-2)))
  #   = exp(log(|x|) + 0.5 * log(1 + x**-2))
  #   = |x| * sqrt(1 + x**-2)
  # and drop the trailing factor: once |x| > 1 / sqrt(machine epsilon),
  # sqrt(1 + x**-2) rounds to exactly 1, so |x| alone is the correctly
  # rounded result.  The same holds for gradients: the first derivative of
  # sqrt(1 + x**-2) is -2 * x**-3 / (1 + x**-2) = -2 / (x**3 + x), and the
  # nth-order derivative is O(x**-(n + 2)), so every gradient term that
  # contains a derivative of sqrt(1 + x**-2) vanishes as well.
  large_x_result = math_ops.abs(x)
  return array_ops.where_v2(naive_is_safe, naive_result, large_x_result)
class SinhArcsinh(bijector.Bijector):
  """Compute `Y = g(X) = Sinh( (Arcsinh(X) + skewness) * tailweight )`.

  For `skewness in (-inf, inf)` and `tailweight in (0, inf)`, this
  transformation is a diffeomorphism of the real line `(-inf, inf)`.
  The inverse transform is
  `X = g^{-1}(Y) = Sinh( ArcSinh(Y) / tailweight - skewness )`.

  The `SinhArcsinh` transformation of the Normal is described in
  [Sinh-arcsinh distributions](https://www.jstor.org/stable/27798865).
  This Bijector allows a similar transformation of any distribution
  supported on `(-inf, inf)`.

  #### Meaning of the parameters

  * If `skewness = 0` and `tailweight = 1`, this transform is the identity.
  * Positive (negative) `skewness` leads to positive (negative) skew.
    * positive skew means, for unimodal `X` centered at zero, the mode of `Y`
      is "tilted" to the right.
    * positive skew means positive values of `Y` become more likely, and
      negative values become less likely.
  * Larger (smaller) `tailweight` leads to fatter (thinner) tails.
    * Fatter tails mean larger values of `|Y|` become more likely.
    * If `X` is a unit Normal, `tailweight < 1` leads to a distribution that
      is "flat" around `Y = 0`, and a very steep drop-off in the tails.
    * If `X` is a unit Normal, `tailweight > 1` leads to a distribution more
      peaked at the mode with heavier tails.

  To see the argument about the tails, note that for `|X| >> 1` and
  `|X| >> (|skewness| * tailweight)**tailweight`, we have
  `Y approx 0.5 X**tailweight e**(sign(X) skewness * tailweight)`.
  """

  @deprecation.deprecated(
      "2018-10-01",
      "The TensorFlow Distributions library has moved to "
      "TensorFlow Probability "
      "(https://github.com/tensorflow/probability). You "
      "should update all references to use `tfp.distributions` "
      "instead of `tf.contrib.distributions`.",
      warn_once=True)
  def __init__(self,
               skewness=None,
               tailweight=None,
               validate_args=False,
               name="SinhArcsinh"):
    """Instantiates the `SinhArcsinh` bijector.

    Args:
      skewness: Skewness parameter. Float-type `Tensor`. Default is `0`
        of type `float32`.
      tailweight: Tailweight parameter. Positive `Tensor` of same `dtype` as
        `skewness` and broadcastable `shape`. Default is `1` of type
        `float32`.
      validate_args: Python `bool` indicating whether arguments should be
        checked for correctness.
      name: Python `str` name given to ops managed by this object.
    """
    self._graph_parents = []
    self._name = name
    self._validate_args = validate_args
    with self._name_scope("init", values=[skewness, tailweight]):
      # Unspecified parameters default to the identity transform
      # (skewness 0, tailweight 1).
      if skewness is None:
        skewness = 0.
      if tailweight is None:
        tailweight = 1.
      self._skewness = ops.convert_to_tensor(skewness, name="skewness")
      # Force tailweight onto skewness's dtype so mixed-precision inputs
      # fail loudly rather than silently up-casting.
      self._tailweight = ops.convert_to_tensor(
          tailweight, name="tailweight", dtype=self._skewness.dtype)
      check_ops.assert_same_float_dtype([self._skewness, self._tailweight])
      if validate_args:
        assertions = [
            check_ops.assert_positive(
                self._tailweight,
                message="Argument tailweight was not positive")
        ]
        self._tailweight = control_flow_ops.with_dependencies(
            assertions, self._tailweight)
    super(SinhArcsinh, self).__init__(
        forward_min_event_ndims=0,
        validate_args=validate_args,
        name=name)

  @property
  def skewness(self):
    """The `skewness` in: `Y = Sinh((Arcsinh(X) + skewness) * tailweight)`."""
    return self._skewness

  @property
  def tailweight(self):
    """The `tailweight` in: `Y = Sinh((Arcsinh(X) + skewness) * tailweight)`."""
    return self._tailweight

  def _forward(self, x):
    shifted = math_ops.asinh(x) + self.skewness
    return math_ops.sinh(shifted * self.tailweight)

  def _inverse(self, y):
    rescaled = math_ops.asinh(y) / self.tailweight
    return math_ops.sinh(rescaled - self.skewness)

  def _inverse_log_det_jacobian(self, y):
    # x = sinh(arcsinh(y) / tailweight - skewness).  Using sinh' = cosh and
    # arcsinh'(y) = 1 / sqrt(y**2 + 1):
    #   dx/dy = cosh(arcsinh(y) / tailweight - skewness)
    #           / (tailweight * sqrt(y**2 + 1))
    # The quotient is formed before taking the log to avoid catastrophic
    # cancellation between the (potentially enormous) cosh and sqrt terms.
    numerator = math_ops.cosh(
        math_ops.asinh(y) / self.tailweight - self.skewness)
    # TODO(srvasude): Consider using cosh(arcsinh(x)) in cases
    # where (arcsinh(x) / tailweight) - skewness ~= arcsinh(x).
    return (math_ops.log(numerator / _sqrtx2p1(y))
            - math_ops.log(self.tailweight))

  def _forward_log_det_jacobian(self, x):
    # y = sinh((arcsinh(x) + skewness) * tailweight).  Using sinh' = cosh and
    # arcsinh'(x) = 1 / sqrt(x**2 + 1):
    #   dy/dx = cosh((arcsinh(x) + skewness) * tailweight)
    #           * tailweight / sqrt(x**2 + 1)
    # The quotient is formed before taking the log to avoid catastrophic
    # cancellation between the (potentially enormous) cosh and sqrt terms.
    numerator = math_ops.cosh(
        (math_ops.asinh(x) + self.skewness) * self.tailweight)
    # TODO(srvasude): Consider using cosh(arcsinh(x)) in cases
    # where (arcsinh(x) + skewness) * tailweight ~= arcsinh(x).
    return (math_ops.log(numerator / _sqrtx2p1(x))
            + math_ops.log(self.tailweight))