kernels/portable/cpu/op_gelu.cpp - platform/external/executorch - Git at Google

 /*
  * Copyright (c) Meta Platforms, Inc. and affiliates.
  * All rights reserved.
  *
  * This source code is licensed under the BSD-style license found in the
  * LICENSE file in the root directory of this source tree.
  */

 #include <cmath>

 #include <executorch/kernels/portable/cpu/math_constants.h>
 #include <executorch/kernels/portable/cpu/util/activation_ops_util.h>
 #include <executorch/kernels/portable/cpu/util/functional_util.h>
 #include <executorch/runtime/kernel/kernel_includes.h>

 namespace torch {
 namespace executor {
 namespace native {

 using Tensor = exec_aten::Tensor;
 using ScalarType = exec_aten::ScalarType;
 using string_view = exec_aten::string_view;

 Tensor& gelu_out(
     RuntimeContext& ctx,
     const Tensor& in,
     string_view approximate,
     Tensor& out) {
   (void)ctx;

   ET_KERNEL_CHECK(
       ctx, check_gelu_args(in, approximate, out), InvalidArgument, out);

   ET_KERNEL_CHECK(
       ctx, resize_tensor(out, in.sizes()) == Error::Ok, InvalidArgument, out);

   ET_KERNEL_CHECK(
       ctx, tensors_have_same_dim_order(in, out), InvalidArgument, out);

   ET_SWITCH_FLOAT_TYPES(in.scalar_type(), ctx, "gelu.out", CTYPE, [&]() {
     if (approximate == "tanh") {
       apply_unary_map_fn(
           [](const CTYPE x) {
             if (x == -std::numeric_limits<CTYPE>::infinity()) {
               return static_cast<CTYPE>(0.0);
             } else if (x == std::numeric_limits<CTYPE>::infinity()) {
               return std::numeric_limits<CTYPE>::infinity();
             }
             const CTYPE kBeta = M_SQRT2 * M_2_SQRTPI * 0.5;
             const CTYPE kKappa = static_cast<float>(0.044715);

             const CTYPE x_cubed = x * x * x;
             const CTYPE inner = kBeta * (x + kKappa * x_cubed);
             const CTYPE ret = 0.5 * x * (1 + std::tanh(inner));

             return ret;
           },
           in.const_data_ptr<CTYPE>(),
           out.mutable_data_ptr<CTYPE>(),
           in.numel());
     } else if (approximate == "none") {
       apply_unary_map_fn(
           [](const CTYPE x) {
             if (x == -std::numeric_limits<CTYPE>::infinity()) {
               return static_cast<CTYPE>(0.0);
             } else if (x == std::numeric_limits<CTYPE>::infinity()) {
               return std::numeric_limits<CTYPE>::infinity();
             }
             return static_cast<CTYPE>(0.5 * x * (1 + std::erf(x * M_SQRT1_2)));
           },
           in.const_data_ptr<CTYPE>(),
           out.mutable_data_ptr<CTYPE>(),
           in.numel());
     } else {
       ET_CHECK_MSG(
           false,
           "Invalid approximation format: %.*s for gelu",
           static_cast<int>(approximate.length()),
           approximate.data());
     }
   });

   return out;
 }

 } // namespace native
 } // namespace executor
 } // namespace torch
	/*
	* Copyright (c) Meta Platforms, Inc. and affiliates.
	* All rights reserved.
	*
	* This source code is licensed under the BSD-style license found in the
	* LICENSE file in the root directory of this source tree.
	*/

	#include <cmath>

	#include <executorch/kernels/portable/cpu/math_constants.h>
	#include <executorch/kernels/portable/cpu/util/activation_ops_util.h>
	#include <executorch/kernels/portable/cpu/util/functional_util.h>
	#include <executorch/runtime/kernel/kernel_includes.h>

	namespace torch {
	namespace executor {
	namespace native {

	using Tensor = exec_aten::Tensor;
	using ScalarType = exec_aten::ScalarType;
	using string_view = exec_aten::string_view;

	Tensor& gelu_out(
	RuntimeContext& ctx,
	const Tensor& in,
	string_view approximate,
	Tensor& out) {
	(void)ctx;

	ET_KERNEL_CHECK(
	ctx, check_gelu_args(in, approximate, out), InvalidArgument, out);

	ET_KERNEL_CHECK(
	ctx, resize_tensor(out, in.sizes()) == Error::Ok, InvalidArgument, out);

	ET_KERNEL_CHECK(
	ctx, tensors_have_same_dim_order(in, out), InvalidArgument, out);

	ET_SWITCH_FLOAT_TYPES(in.scalar_type(), ctx, "gelu.out", CTYPE, [&]() {
	if (approximate == "tanh") {
	apply_unary_map_fn(
	[](const CTYPE x) {
	if (x == -std::numeric_limits<CTYPE>::infinity()) {
	return static_cast<CTYPE>(0.0);
	} else if (x == std::numeric_limits<CTYPE>::infinity()) {
	return std::numeric_limits<CTYPE>::infinity();
	}
	const CTYPE kBeta = M_SQRT2 * M_2_SQRTPI * 0.5;
	const CTYPE kKappa = static_cast<float>(0.044715);

	const CTYPE x_cubed = x * x * x;
	const CTYPE inner = kBeta * (x + kKappa * x_cubed);
	const CTYPE ret = 0.5 * x * (1 + std::tanh(inner));

	return ret;
	},
	in.const_data_ptr<CTYPE>(),
	out.mutable_data_ptr<CTYPE>(),
	in.numel());
	} else if (approximate == "none") {
	apply_unary_map_fn(
	[](const CTYPE x) {
	if (x == -std::numeric_limits<CTYPE>::infinity()) {
	return static_cast<CTYPE>(0.0);
	} else if (x == std::numeric_limits<CTYPE>::infinity()) {
	return std::numeric_limits<CTYPE>::infinity();
	}
	return static_cast<CTYPE>(0.5 * x * (1 + std::erf(x * M_SQRT1_2)));
	},
	in.const_data_ptr<CTYPE>(),
	out.mutable_data_ptr<CTYPE>(),
	in.numel());
	} else {
	ET_CHECK_MSG(
	false,
	"Invalid approximation format: %.*s for gelu",
	static_cast<int>(approximate.length()),
	approximate.data());
	}
	});

	return out;
	}

	} // namespace native
	} // namespace executor
	} // namespace torch