import argparse
from itertools import groupby
from ..autograd.utils import CodeTemplate, write, uninplace_api_name
from ..autograd.gen_autograd import load_aten_declarations

# JIT has a type system of
#   Scalar = int | float | bool   # int is the largest int (int64_t) and float the
#                                 # largest float (double); we don't have the others
#                                 # because they are never held in tensors
#   Type = Scalar                 # primitive numbers
#        | Tensor                 # any tensor, as defined by at::Tensor
#        | Type[]                 # a dynamically sized list of a type
#        | Scalar[N]              # a homogeneous fixed-size scalar list; a single scalar can expand to this list
#        | (Type1, Type2, ...)    # a heterogeneous tuple
#        | Layout | ScalarType | Device | Generator  # special singleton types for built-in concepts in the tensor lib
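#
# An illustrative schema using these types (a hypothetical op, not taken from
# Declarations.yaml):
#   aten::example(Tensor self, Scalar alpha, int[2] padding, bool[3] flags) -> (Tensor, Tensor)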

# clean up the variety of C++ types in the ATen declarations
# to be in the restricted set of types that the IR represents
# note: no default values for this map, to make it clear what types
# can be passed through
TYPE_MAP = {
    'std::array<bool,2>': 'bool[2]',
    'std::array<bool,3>': 'bool[3]',
    'std::array<bool,4>': 'bool[4]',
    'Scalar': 'Scalar',
    'Tensor': 'Tensor',
    'TensorList': 'Tensor[]',
    # this appears in return values instead of TensorList
    # since TensorList is an ArrayRef in arguments but a vector
    # in returns
    'std::vector<Tensor>': 'Tensor[]',
    'IntList': 'int[]',
    'Layout': 'Layout',
    'Device': 'Device',
    'ScalarType': 'ScalarType',
    'int64_t': 'int',
    'double': 'float',
    'bool': 'bool',
    'Generator': 'Generator',
}

def jit_type_of(arg):
    typ = TYPE_MAP[arg['simple_type']]
    if is_sized_intlist_arg(arg):
        typ = 'int[{}]'.format(arg['size'])
    if arg.get('is_nullable'):
        typ = '{}?'.format(typ)
    return typ
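
# A minimal sketch of what jit_type_of yields for hand-written argument dicts
# shaped like the entries load_aten_declarations produces:
#   jit_type_of({'simple_type': 'IntList', 'size': 2})          == 'int[2]'
#   jit_type_of({'simple_type': 'Tensor', 'is_nullable': True}) == 'Tensor?'
#   jit_type_of({'simple_type': 'double'})                      == 'float'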

# map from aten 'simple_type' to the expression that converts an IValue
# popped from the interpreter stack into that C++ type
FROM_IVALUE = {
    'Device': 'as_device({}.toIntList()->elements())',
    'IntList': '{}.toIntList()->elements()',
    'Layout': 'static_cast<at::Layout>({}.toInt())',
    'Scalar': '{}.toScalar()',
    'ScalarType': 'static_cast<at::ScalarType>({}.toInt())',
    'Tensor': '{}.toTensor()',
    'TensorList': '{}.toTensorList()->elements()',
    'bool': 'bool({}.toInt())',
    'double': '{}.toDouble()',
    'int64_t': '{}.toInt()',
    'std::array<bool,2>': 'as_bool_array<2>({}.toIntList()->elements())',
    'std::array<bool,3>': 'as_bool_array<3>({}.toIntList()->elements())',
    'std::array<bool,4>': 'as_bool_array<4>({}.toIntList()->elements())',
}

def from_ivalue(arg, value):
    simple_type = arg['simple_type']
    return FROM_IVALUE[simple_type].format(value)
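
# A minimal sketch of the C++ expression from_ivalue builds ('self' and the peek
# expression below are hypothetical inputs):
#   from_ivalue({'name': 'self', 'simple_type': 'Tensor'}, '(std::move(peek(stack, 0, 3)))')
#     == '(std::move(peek(stack, 0, 3))).toTensor()'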

CALL_NAMESPACE = CodeTemplate("""\
auto result = at::${name}(
    ${args}
);
""")
CALL_METHOD = CodeTemplate("""\
DeviceGuard device_guard(deviceForInputs(stack, ${num_inputs}));
auto result = (${first}).${name}(
    ${args}
);
""")
CALL_TENSOR_OPTIONS = CodeTemplate("""\
const auto options = TensorOptions()
        .dtype(${dtype})
        .layout(${layout})
        .device(${device});
auto result = torch::${name}(
    ${args},
    options
);
""")
CONSTRUCTOR = CodeTemplate("""\
[](Stack & stack) {
    autograd::profiler::RecordFunction record("${name}");
    ${call}
    drop(stack, ${num_inputs});
    pack(stack, std::move(result));
    return 0;
}
""")
OPERATOR = CodeTemplate("""\
Operator(
    "${signature}",
    ${op}
),
""")

def is_magic_method(api_name):
    return api_name.startswith('__') and api_name.endswith('__')
blacklisted_types = {'SparseTensorRef', 'Storage', 'ScalarType', 'optional<ScalarType>', 'std::string', 'void*'}
default_only_types = {'Generator'}

def is_jit_arg(i, arg):
    simple_type = arg['simple_type']
    if simple_type in blacklisted_types:
        return False
    if simple_type in default_only_types and 'default' not in arg:
        return False
    if simple_type == 'Type':
        return False
    return True

def is_jit_op(decl):
    # We currently don't support functions that return nothing
    if all(r['type'] == 'void' for r in decl['returns']):
        return False
    # we currently only support vararg tensor lists when they are the _first_ argument
    # and the only tensor argument
    arguments = decl['arguments']
    return ((not decl['api_name'].endswith('_') or is_magic_method(decl['api_name'])) and
            not decl['name'].endswith('_out') and
            ('namespace' in decl['method_of'] or 'Tensor' in decl['method_of']) and
            all(is_jit_arg(i, arg) for i, arg in enumerate(decl['arguments'])) and
            all(is_jit_arg(i, arg) for i, arg in enumerate(decl['returns'])))
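
# For example (illustrative): an in-place variant such as add_ and an out variant
# such as add_out are rejected by the checks above, while the plain add overloads
# are kept.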

def is_tensor_arg(arg):
    return arg['simple_type'] in {'Tensor', 'TensorList'}

def is_sized_intlist_arg(arg):
    """Returns True for arguments declared as IntList[k], but False for IntList."""
    return (arg['simple_type'] == 'IntList') and ('size' in arg)

def gen_jit_dispatch(declarations, out, template_path):
    REGISTER_ATEN_OPS_CPP = CodeTemplate.from_file(template_path + '/register_aten_ops.cpp')
    ATEN_INTERNED_STRINGS_H = CodeTemplate.from_file(template_path + '/aten_interned_strings.h')
    ops = []

    def get_invocation(decl, args, num_inputs):
        # because the arg list can get lengthy we put them on a separate line
        def pack_arguments(args):
            return ',\n'.join(args)
        if decl.get('has_tensor_options'):
            return CALL_TENSOR_OPTIONS.substitute(name=decl['name'],
                                                  args=pack_arguments(args[:-3]),
                                                  dtype=args[-3],
                                                  layout=args[-2],
                                                  device=args[-1])
        elif 'namespace' in decl['method_of']:
            return CALL_NAMESPACE.substitute(name=decl['name'],
                                             args=pack_arguments(args),
                                             num_inputs=num_inputs)
        else:
            return CALL_METHOD.substitute(
                name=decl['name'], first=args[0], args=pack_arguments(args[1:]),
                num_inputs=num_inputs)

    def emit_decl_variant(decl):
        kw_assignments = []
        arguments = []
        num_inputs = len(decl['arguments'])
        op_capture = ''
        real_inputs = 0
        for arg in decl['arguments']:
            if arg['simple_type'] in default_only_types:
                arguments.append(arg['default'])
            else:
                value = '(std::move(peek(stack, {}, {})))'.format(real_inputs, num_inputs)
                arguments.append(from_ivalue(arg, value))
                real_inputs += 1
        call = get_invocation(decl, arguments, num_inputs)
        returns = decl['returns']
        constructor = CONSTRUCTOR.substitute(name=decl['name'],
                                             call=call,
                                             kw_assignments=kw_assignments,
                                             num_inputs=num_inputs,
                                             op_capture=op_capture)
        return constructor

    # This function declares an order on declarations. This is necessary because
    # there is some ambiguity in the choice of overload: if an argument is overloaded
    # to accept both Scalar and Tensor, the schema with the Tensor should come first.
    # TODO: this can (probably) be removed when we remove the implicit conversion
    # from Tensor -> Number.
    def sort_decls(jit_decls):
        def declkey(decl):
            # key = sum_{i < len(args)} {1 if arg is tensor else 2} * (3 ** i)
            # This is a ternary encoding where
            #   0: No argument at this position
            #   1: Tensor argument at this position
            #   2: Some other argument at this position.
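            # Worked example (illustrative): for two hypothetical two-argument
            # overloads,
            #   (Tensor, Tensor) -> 1*3**0 + 1*3**1 = 4
            #   (Tensor, Scalar) -> 1*3**0 + 2*3**1 = 7
            # so the all-Tensor schema sorts (and is registered) first.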
            args = decl['arguments']
            result = 0
            for i in range(len(args)):
                result += (3 ** i) * (1 if args[i]['simple_type'] == 'Tensor' else 2)
            return result
        # NB: itertools.groupby requires the list be sorted.
        sorted_decls = sorted(jit_decls, key=lambda decl: decl['name'])
        grouped_decls = [list(g) for _, g in
                         groupby(sorted_decls, key=lambda decl: decl['name'])]
        result = []
        for group in grouped_decls:
            sorted_decls = sorted(group, key=declkey)
            result.extend(sorted_decls)
        return result

    # We need to add methods implemented manually in TensorImpl
    tensor_impl_methods = [{
        'name': name,
        'api_name': name,
        'method_of': ['Tensor'],
        'arguments': [{'name': 'self', 'simple_type': 'Tensor'}],
        'returns': [{'name': 'result', 'type': 'int64_t', 'dynamic_type': 'int64_t', 'simple_type': 'int64_t'}],
    } for name in ['sizes', 'strides', 'dim']]
    aten_decls = load_aten_declarations(declarations) + tensor_impl_methods
    jit_decls = [d for d in aten_decls if is_jit_op(d)]

    # add dtype, layout, and device arguments for factory functions like zeros
    for decl in jit_decls:
        arguments = decl['arguments']
        for n, arg in enumerate(arguments):
            if arg['simple_type'] == 'TensorOptions':
                del arguments[n]
                arguments.extend([
                    # XXX - until we actually have first-class interpreter types for these
                    # concepts, the defaults are encoded in the representations below.
                    # If you change this, you also need to update [TensorOptions in script]
                    # in the tracer code.
                    # dtype is specified as an int64_t of at::ScalarType
                    {'name': 'dtype', 'simple_type': 'ScalarType', 'default': 'float', 'kwarg_only': True},
                    # layout is specified as an int64_t of at::Layout
                    {'name': 'layout', 'simple_type': 'Layout', 'default': 'strided', 'kwarg_only': True},
                    # device is specified as an IntList of { at::Device::Type, device_id }
                    {'name': 'device', 'simple_type': 'Device', 'kwarg_only': True,
                     'default': '[cpu, -1]'},
                ])
                decl['has_tensor_options'] = True
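
    # After this rewrite, a factory declaration such as zeros(IntList size,
    # TensorOptions options) is exposed to the JIT roughly as (illustrative):
    #   aten::zeros(int[] size, *, ScalarType dtype=float, Layout layout=strided,
    #               Device device=[cpu, -1]) -> Tensor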

    jit_decls = sort_decls(jit_decls)
    for decl in jit_decls:
        ops.append(OPERATOR.substitute(signature=signature(decl),
                                       op=emit_decl_variant(decl)))
    # The declarations were sorted above, so the generated snippets come out in a
    # deterministic order
    env = {
        'constructors': ops,
    }
    write(out, 'register_aten_ops.cpp', REGISTER_ATEN_OPS_CPP, env)

    # NB: Operate on aten_decls, not jit_decls, because VariableType is
    # a client for these symbols as well
    # NB: This means we DON'T generate interned strings for inplace ops.
    # Change this when you do!
    # NB: Keep this code synchronized with the code in
    # tools/autograd/gen_variable_type.py
    # NB: Some operations have inplace versions, but NOT non-inplace
    # versions! Thus uninplace_api_name() is mandatory (if you remove
    # it, you will get missing symbols).
    names = set(uninplace_api_name(decl['api_name']) for decl in aten_decls)
    # NB: This grabs non-keyword arguments too, but it's harmless
    attrs = set(arg['name'] for decl in aten_decls for arg in decl['arguments'])
    strings_env = {
        'aten_symbols': ["_(aten, {}) \\".format(n) for n in sorted(names)],
        'attr_symbols': ["_(attr, {}) \\".format(n) for n in sorted(attrs)]
    }
    write(out, 'aten_interned_strings.h', ATEN_INTERNED_STRINGS_H, strings_env)
default_map = {'{}': 'None', 'nullptr': 'None'}

def signature(decl):
    def format_arg(arg):
        name = arg['name']
        typ = jit_type_of(arg)
        decl = '{} {}'.format(typ, name)
        if 'default' in arg:
            # clean up initializer lists {{true, true}} -> [true, true]
            default = str(arg['default']) \
                .replace('{{', '[') \
                .replace('}}', ']') \
                .replace('true', 'True') \
                .replace('false', 'False') \
                .replace('nullptr', 'None') \
                .replace('Reduction::ElementwiseMean', 'ElementwiseMean') \
                .replace('{}', 'None' if is_tensor_arg(arg) else '[]') \
                .replace('{', '[') \
                .replace('}', ']')
            default = default_map.get(default, default)
            decl = '{}={}'.format(decl, default)
        return decl

    args = []
    kwarg_only = False
    for a in decl['arguments']:
        if not kwarg_only and a.get('kwarg_only'):
            args.append('*')
            kwarg_only = True
        args.append(format_arg(a))
    arg_list = ', '.join(args)
    if len(decl['returns']) == 1:
        ret_list = jit_type_of(decl['returns'][0])
    else:
        ret_list = '({})'.format(', '.join(jit_type_of(r) for r in decl['returns']))
    return 'aten::{}({}) -> {}'.format(decl['name'], arg_list, ret_list)
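
# A sketch of the schema strings signature() produces (illustrative examples; the
# real entries are driven by Declarations.yaml):
#   aten::relu(Tensor self) -> Tensor
#   aten::topk(Tensor self, int k, int dim=-1, bool largest=True, bool sorted=True) -> (Tensor, Tensor)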

def main():
    parser = argparse.ArgumentParser(
        description='Generate JIT op dispatch')
    parser.add_argument('declarations', metavar='DECL',
                        help='path to Declarations.yaml')
    parser.add_argument('out', metavar='OUT',
                        help='path to output directory')
    parser.add_argument('template_path', metavar='TEMPLATE_PATH',
                        help='path to templates directory')
    args = parser.parse_args()
    gen_jit_dispatch(args.declarations, args.out, args.template_path)

if __name__ == '__main__':
    main()