Fix binary size in schema inference (#26878)

Summary:
Pull Request resolved: https://github.com/pytorch/pytorch/pull/26878

Previously, for each function signature used in one or more ops, there was a template instantiation that created the FunctionSchema object for it. As we've seen in the past, all the vector<> constructors in the FunctionSchema object take up quite a bit of binary size.

With this PR, we now create an intermediate constexpr std::array that has minimal binary size and can be embedded into the executable; then, at runtime, a small piece of code constructs the vector<> objects from it.

This reduces the libtorch.so binary size by 800 KB.

ghstack-source-id: 90842811

Test Plan: measure libtorch.so size

Differential Revision: D17597752

fbshipit-source-id: 53442b565a7747c0d0384b2e3b845729c3daddfd

commit: 771bcce6f1a09bee5f0b78f967dd2ab9ebc11817 [log] [tgz]
author: Sebastian Messmer <messmer@fb.com> Thu Sep 26 16:53:13 2019 -0700
committer: Facebook Github Bot <facebook-github-bot@users.noreply.github.com> Thu Sep 26 16:59:00 2019 -0700
tree: 89610be2d184e97dd4715e53065d1e2e3f69bb67
parent: 54b66c8c203b3b5c11d9bb6eca9dae45902bd967 [diff]
diff --git a/aten/src/ATen/core/op_registration/infer_schema.h b/aten/src/ATen/core/op_registration/infer_schema.h
index 968c04e..9971435 100644
--- a/aten/src/ATen/core/op_registration/infer_schema.h
+++ b/aten/src/ATen/core/op_registration/infer_schema.h

@@ -10,45 +10,63 @@
 #include <c10/util/Metaprogramming.h>
 
 namespace c10 {
-
 namespace detail {
-/// Checks the static C++ type `T` for correctness to catch common error cases.
-template <typename T>
-void checkStaticTypes() {
+
+namespace infer_schema {
+
+/// The templated inference code creates `ArgumentDef` instead of `Argument`,
+/// because that can be constructed at compile time and has a much smaller
+/// binary size than having calls to `Argument` constructors in the template.
+/// Creating `Argument` objects from `ArgumentDef` can then be done at
+/// runtime in a non-templated way.
+struct ArgumentDef final {
+  using GetTypeFn = TypePtr();
+  GetTypeFn* getTypeFn;
+};
+
+template<bool V>
+struct bool_t {};
+template<> struct bool_t<true> : std::true_type {};
+template<> struct bool_t<false> : std::false_type {};
+
+/// Checks the static C++ types `Types` for correctness to catch common error cases.
+template <class... Types>
+constexpr int checkStaticTypes() {
  // Give nice error messages for some of the common error cases.
  // Use a LOUD ERROR MESSAGE SO USERS SEE THE STATIC_ASSERT
- static_assert(
-     !std::is_integral<T>::value || std::is_same<T, int64_t>::value || std::is_same<T, bool>::value,
-     "INVALID TYPE: Only int64_t and bool are supported as an integral argument type");
- static_assert(
-     !std::is_same<T, float>::value,
-     "INVALID TYPE: float is not supported as an argument type, use double instead");
+ static_assert(guts::conjunction<
+     bool_t<!std::is_integral<Types>::value || std::is_same<Types, int64_t>::value || std::is_same<Types, bool>::value>...
+   >::value, "INVALID TYPE: Only int64_t and bool are supported as an integral argument type");
+ static_assert(guts::conjunction<
+     bool_t<!std::is_same<Types, float>::value>...
+   >::value, "INVALID TYPE: float is not supported as an argument type, use double instead");
+ return 0;
 }
 
 template <typename... Ts, size_t... Is>
-::std::vector<Argument> createArgumentVectorFromTypes(guts::index_sequence<Is...>) {
-  // Check types for common errors
-  (void)std::initializer_list<int>{(
-    checkStaticTypes<Ts>()
-  , 0)...};
+constexpr std::array<ArgumentDef, sizeof...(Ts)> createArgumentVectorFromTypes(guts::index_sequence<Is...>) {
+  return (
+    // Check types for common errors
+    checkStaticTypes<Ts...>(),
 
-  // Arguments are named "_<index>"
-  return {Argument("_" + c10::guts::to_string(Is), getTypePtr<guts::decay_t<Ts>>())...};
+    // Create the return value
+    std::array<ArgumentDef, sizeof...(Ts)>{{ArgumentDef{&getTypePtr_<guts::decay_t<Ts>>::call}...}}
+  );
 }
 
-/// Creates a vector of `Argument` from a list of C++ types that are specified
+/// Creates an array of `ArgumentDef` from a list of C++ types that are specified
 /// as template arguments.
 template<class ParameterTypes> struct createArguments final {};
 template<class... ParameterTypes>
 struct createArguments<guts::typelist::typelist<ParameterTypes...>> final {
-  static std::vector<Argument> call() {
+  static constexpr std::array<ArgumentDef, sizeof...(ParameterTypes)> call() {
     return createArgumentVectorFromTypes<ParameterTypes...>(
         guts::make_index_sequence<sizeof...(ParameterTypes)>()
     );
   }
 };
 
-/// Creates a vector of `Argument` from a list of C++ types that are specified
+/// Creates an array of `ArgumentDef` from a list of C++ types that are specified
 /// as a tuple (i.e. in the way c10 kernels return values).
 /// It can be a tuple<A, B, C> if there's three output arguments with types A, B, C.
 /// It can be an empty tuple<>, or void for kernels that don't return anything.
@@ -58,7 +76,7 @@
 
 template<class... ReturnTypes>
 struct createReturns<std::tuple<ReturnTypes...>, void> final {
-  static std::vector<Argument> call() {
+  static constexpr std::array<ArgumentDef, sizeof...(ReturnTypes)> call() {
     return createArgumentVectorFromTypes<ReturnTypes...>(
         guts::make_index_sequence<sizeof...(ReturnTypes)>()
     );
@@ -67,24 +85,40 @@
 
 template<class ReturnType>
 struct createReturns<ReturnType, guts::enable_if_t<!std::is_same<void, ReturnType>::value && !guts::is_instantiation_of<std::tuple, ReturnType>::value>> final {
-  static std::vector<Argument> call() {
+  static constexpr std::array<ArgumentDef, 1> call() {
     return createReturns<std::tuple<ReturnType>>::call();
   }
 };
 
 template<>
 struct createReturns<void, void> final {
-  static std::vector<Argument> call() {
+  static constexpr std::array<ArgumentDef, 0> call() {
     return createReturns<std::tuple<>>::call();
   }
 };
 
-// This is intentionally a separate function and not part of createFunctionSchemaFromTraits
+template<size_t NumArgs>
+std::vector<Argument> createArgumentVector(const std::array<ArgumentDef, NumArgs>& args) {
+  std::vector<Argument> result;
+  result.reserve(NumArgs);
+  for (size_t i = 0; i < args.size(); ++i) {
+    // Arguments are named "_<index>"
+    result.push_back(Argument("_" + c10::guts::to_string(i), (*args[i].getTypeFn)()));
+  }
+  return result;
+}
+
+// This is intentionally a separate function
 // because then the template is smaller and that benefits binary size
 inline FunctionSchema make_function_schema(std::string&& name, std::string&& overload_name, std::vector<Argument>&& arguments, std::vector<Argument>&& returns) {
   return FunctionSchema(std::move(name), std::move(overload_name), std::move(arguments), std::move(returns));
 }
 
+template<size_t NumArgs, size_t NumReturns>
+inline FunctionSchema make_function_schema(std::string&& name, std::string&& overload_name, const std::array<ArgumentDef, NumArgs>& arguments, const std::array<ArgumentDef, NumReturns>& returns) {
+  return make_function_schema(std::move(name), std::move(overload_name), createArgumentVector(arguments), createArgumentVector(returns));
+}
+
 /// Creates a `FunctionSchema` object from a `FunctionTraits` type for a
 /// function.
 template <typename FunctionTraits>
@@ -92,13 +126,17 @@
  using ReturnType = typename FunctionTraits::return_type;
  using ParameterTypes = typename FunctionTraits::parameter_types;
 
- return make_function_schema(std::move(name), std::move(overload_name), createArguments<ParameterTypes>::call(), createReturns<ReturnType>::call());
+ constexpr auto arguments = createArguments<ParameterTypes>::call();
+ constexpr auto returns = createReturns<ReturnType>::call();
+
+ return make_function_schema(std::move(name), std::move(overload_name), arguments, returns);
+}
 }
 }
 
 template<class FuncType>
 FunctionSchema inferFunctionSchema(std::string&& name, std::string&& overload_name) {
-  return detail::createFunctionSchemaFromTraits<guts::infer_function_traits_t<FuncType>>(std::move(name), std::move(overload_name));
+  return detail::infer_schema::createFunctionSchemaFromTraits<guts::infer_function_traits_t<FuncType>>(std::move(name), std::move(overload_name));
 }
 
 CAFFE2_API c10::optional<std::string> findSchemaDifferences(const FunctionSchema& inferred, const FunctionSchema& specified);
commit	771bcce6f1a09bee5f0b78f967dd2ab9ebc11817	[log] [tgz]
author	Sebastian Messmer <messmer@fb.com>	Thu Sep 26 16:53:13 2019 -0700
committer	Facebook Github Bot <facebook-github-bot@users.noreply.github.com>	Thu Sep 26 16:59:00 2019 -0700
tree	89610be2d184e97dd4715e53065d1e2e3f69bb67
parent	54b66c8c203b3b5c11d9bb6eca9dae45902bd967 [diff]