# blob: dba363de106f50f9ec3b7331f6c7af0f8607c245 [file] [log] [blame]
import inspect
import torch
import collections
import types
import textwrap
import functools
import warnings
import torch._jit_internal as _jit_internal
from torch.jit.frontend import get_default_args
from torch.nn import Module, ModuleList, Sequential, ModuleDict
from torch._six import get_function_from_type, bind_method
# A method queued for compilation into a ScriptModule.
#   resolution_callback: the callback `make_stub` obtains from
#       `_jit_internal.createResolutionCallbackFromClosure`
#   def_: the JIT definition `make_stub` obtains from `torch.jit.get_jit_def`
#   original_method: the Python function the stub was built from; it is None
#       for define()'d methods, which have no Python original
ScriptMethodStub = collections.namedtuple('ScriptMethodStub', ('resolution_callback', 'def_', 'original_method'))
# Attribute names that `infer_raw_concrete_type` skips while scanning
# `dir(nn_module)`, so they are never added to the ConcreteModuleType.
# TODO: there should be a more principled way of doing this.
blacklist = [
    "_version",
    "_parameters",
    "_buffers",
    "_modules",
    "_initializing",
    "_backward_hooks",
    "_forward_hooks",
    "_forward_pre_hooks",
    "_state_dict_hooks",
    "_load_state_dict_pre_hooks",
    "dump_patches",
]
def make_stub(func):
    """
    Build a ScriptMethodStub for the Python function `func`.

    The stub bundles a resolution callback created from the function's
    closure, the JIT definition of the function (with `self` named
    "RecursiveScriptModule") and the function itself.
    """
    return ScriptMethodStub(
        resolution_callback=_jit_internal.createResolutionCallbackFromClosure(func),
        def_=torch.jit.get_jit_def(func, self_name="RecursiveScriptModule"),
        original_method=func,
    )
def make_stub_from_method(nn_module, method):
    """
    Return a ScriptMethodStub for the attribute named `method` on the class
    of `nn_module`.

    If the class attribute already is a ScriptMethodStub it is returned
    unchanged; otherwise a new stub is built from it with `make_stub`.
    """
    candidate = get_function_from_type(type(nn_module), method)
    already_a_stub = isinstance(candidate, ScriptMethodStub)
    return candidate if already_a_stub else make_stub(candidate)
# base types that can be constants
# in addition, tuples and lists of these base types are also considered constants
# If you edit this list, then you also need to edit the handlers in
# ConstantValue in jit/script/init.cpp
_constant_types = (bool, float, int, str, type(None), types.FunctionType, torch.device, torch.layout, torch.dtype)
def _get_valid_constant(attr, v):
if isinstance(v, _constant_types):
return v
elif isinstance(v, tuple) or isinstance(v, list):
return tuple(_get_valid_constant(attr, x) for x in v)
constants = ", ".join(typ.__name__ for typ in _constant_types)
raise TypeError(textwrap.dedent("""
'{}' object for attribute '{}' is not a valid constant.
Valid constants are:
1. a nn.ModuleList
2. a value of type {{{}}}
3. a list or tuple of (2)
""".format(type(v).__name__, attr, constants)))
def infer_raw_concrete_type(nn_module):
    """
    Build a ConcreteModuleType from an nn.Module. This ConcreteModuleType
    doesn't have a JIT type associated with it yet, it must be filled in
    by the caller.

    The module's parameters, submodules, buffers, constants, overloads and
    remaining attributes are recorded on the returned type, in that order.
    `__constants__` and `__overloads__` are copied before being extended, so
    the containers stored on the module (or its class) are not mutated here.

    Arguments:
        nn_module:  The nn.Module instance to describe.

    Returns:
        The populated torch._C.ConcreteModuleType.
    """
    concrete_type = torch._C.ConcreteModuleType()
    concrete_type.add_pyclass(type(nn_module))
    if isinstance(nn_module, (torch.nn.ModuleDict, torch.jit._ConstModuleDict)):
        concrete_type.set_module_dict()
    if isinstance(nn_module, (torch.nn.ModuleList, torch.nn.Sequential, torch.jit._ConstModuleList)):
        concrete_type.set_module_list()

    class_annotations = getattr(nn_module, '__annotations__', {})
    # Names already recorded on `concrete_type`; later passes skip them.
    added_names = set()

    def add_tensor_attributes(tensors, is_param):
        # Shared by the parameter and buffer passes, which differ only in the
        # `is_param` flag handed to `add_attribute`.
        for name, item in tensors.items():
            if item is None:
                # TODO special case: parameters/buffers can be None. The JIT
                # assumes they are Tensor types, so in this case just leave
                # the name for the generic attribute pass below.
                # The "correct" fix here is to add it as a NoneType
                # attribute, but NoneType refinement is currently wonky
                continue
            assert isinstance(item, torch.Tensor)
            attr_type = torch._C._jit_try_infer_type(item)
            concrete_type.add_attribute(name, attr_type, is_param)
            added_names.add(name)

    add_tensor_attributes(nn_module._parameters, True)

    for name, item in nn_module._modules.items():
        sub_concrete_type = concrete_type_store.get_or_create_concrete_type(item)
        concrete_type.add_module(name, sub_concrete_type)
        added_names.add(name)

    add_tensor_attributes(nn_module._buffers, False)

    # populate constants
    # Work on a copy: `__constants__` may be any iterable (a list or tuple has
    # no `.add`), and extending the original would leak `Final` names back
    # onto the module/class. A list keeps the declared order.
    constant_names = list(getattr(nn_module, "__constants__", ()))

    # Constants annotated via `Final[T]` rather than being added to `__constants__`
    for name, ann in class_annotations.items():
        if torch._jit_internal.is_final(ann) and name not in constant_names:
            constant_names.append(name)

    for name in constant_names:
        if name in added_names:
            # XXX: It is possible for something to be in the constants set but
            # also in the parameters/buffers. This happens in BatchNorm as a
            # hack to support optional parameters.
            continue
        if not hasattr(nn_module, name):
            # TODO: We should really error in this case, but there are a couple
            # extant examples of this so leave it for a future PR.
            warnings.warn("'{}' was found in ScriptModule constants, "
                          "but was not actually set in __init__. "
                          "Consider removing it.".format(name))
            continue
        value = getattr(nn_module, name)
        concrete_type.add_constant(name, _get_valid_constant(name, value))
        added_names.add(name)

    # populate overloads
    # Copy before updating so the module's own `__overloads__` dict (possibly
    # a class attribute shared between instances) is left untouched.
    overloads = dict(getattr(nn_module, "__overloads__", {}))
    # update with any annotated overloads
    overloads.update(get_overload_name_mapping(get_overload_annotations(nn_module)))
    for name, overloaded_names in overloads.items():
        concrete_type.add_overload(name, overloaded_names)

    # TODO: [switch to __dict__]
    # we should use __dict__ here because we only want to pick up attributes on
    # this module instance, not the class itself. We can't do it right now
    # because there is code that relies on properties being turned into attributes.
    # This is wrong (the property function is only evaluated once then "saved"
    # as an attribute), so we should fix that and then switch this to using __dict__
    for name in dir(nn_module):
        if name in blacklist or name.startswith("__"):
            # Python objects have lots of random attributes attached to them;
            # PyTorch adds a few more. Prevent these from getting compiled.
            continue

        if name in added_names:
            # Don't re-add anything we already added
            continue

        if not hasattr(nn_module, name):
            # TODO: delete this when [switch to __dict__]
            continue

        item = getattr(nn_module, name)
        if name not in nn_module.__dict__ and not isinstance(getattr(type(nn_module), name, None), property):
            # Skip class attributes that aren't properties
            # TODO: delete this when [switch to __dict__]
            continue

        if inspect.isfunction(item) and not inspect.ismethod(item):
            cls_attr = getattr(type(nn_module), name, None)
            if inspect.isfunction(cls_attr):
                # Skip function attributes that exist on the nn_module class.
                # TODO: delete this when [switch to __dict__]
                continue

            # This is a Python function attribute. Try to script it.
            try:
                item = torch.jit.script(item)
            except Exception as e:
                # If we fail to script the function, it isn't a hard error.
                # Instead, we will add it to the list of attributes we failed
                # to convert, with the compilation error. Processing then
                # continues below with the original Python function.
                hint = ("(This function exists as an attribute on the Python module, "
                        "but we failed to compile it to a TorchScript function. "
                        "\nThe error stack is reproduced here:\n{}").format(e)
                concrete_type.add_failed_attribute(name, hint)

        # An explicit class annotation wins, then a torch.jit.Attribute
        # wrapper's declared type, then inference from the value itself.
        if name in class_annotations:
            attr_type = torch.jit.annotations.ann_to_type(class_annotations[name])
        elif isinstance(item, torch.jit.Attribute):
            attr_type = torch.jit.annotations.ann_to_type(item.type)
        else:
            attr_type = torch._C._jit_try_infer_type(item)

        if attr_type is not None:
            concrete_type.add_attribute(name, attr_type, False)
        else:
            # TODO: could add more detail here. For example, what the user should do
            # when the pytype is `list` or `NoneType`
            hint = ("(This attribute exists on the Python module, "
                    "but we failed to convert Python type: '{}' "
                    "to a TorchScript type.)").format(type(item).__name__)
            concrete_type.add_failed_attribute(name, hint)

    return concrete_type
class ConcreteTypeStore(object):
    """
    Cache of ConcreteModuleTypes, keyed by Python module class, used to
    re-use a JIT type for modules whose inferred concrete types are equal.
    """

    def __init__(self):
        # Python module type => List[ConcreteModuleType]
        self.type_store = {}
        # ConcreteTypes that have had their methods already compiled
        self.methods_compiled = set()

    def get_or_create_concrete_type(self, nn_module):
        """
        Infer a ConcreteType from this `nn.Module` instance. Underlying JIT
        types are re-used if possible.

        Arguments:
            nn_module:  The nn.Module instance to get a ConcreteType for.

        Returns:
            The module's existing `_concrete_type` if it is already a
            ScriptModule carrying one, otherwise a stored type equal to the
            freshly inferred one, otherwise the freshly inferred type (which
            is then given a new JIT type and stored).
        """
        assert isinstance(nn_module, Module)
        if isinstance(nn_module, torch.jit.ScriptModule) and \
                hasattr(nn_module, "_concrete_type"):
            return nn_module._concrete_type

        if isinstance(nn_module, (torch.nn.ModuleList, torch.nn.Sequential, torch.nn.ModuleDict)):
            # TODO: This is here because the compilation path for constant iterable
            # modules is different from everything else. Instead of calling
            # create_script_module, we directly create a
            # _ConstSequential/ModuleList/ModuleDict instance.
            #
            # The path used to create ConcreteTypes involves going in and analyzing
            # all the nn.Modules ahead of time.
            #
            # That leads to skew where the result of generating a ConcreteType
            # (which involves looking at torch.nn.Sequential) is different from the
            # actual compilation path (which directly builds _ConstSequential).
            #
            # The right solution is to make these modules not special in the
            # compilation path. But for now, just mimic what compilation does when
            # generating a ConcreteType
            scripted = create_constant_iterable_module(nn_module)
            return scripted._concrete_type

        raw_concrete_type = infer_raw_concrete_type(nn_module)

        # Search the type store for an already-available JIT type
        known_types = self.type_store.setdefault(type(nn_module), [])
        for known_type in known_types:
            if raw_concrete_type.equals(known_type):
                return known_type

        # We didn't find anything; generate a new JIT type from this concrete type
        raw_concrete_type.create_new_type_from_this()
        known_types.append(raw_concrete_type)
        return raw_concrete_type


# Module-level store shared by the functions in this file.
concrete_type_store = ConcreteTypeStore()
def create_methods_from_stubs(concrete_type, stubs):
    """
    Compile the methods described by `stubs` onto `concrete_type`.

    Arguments:
        concrete_type:  Object whose `_create_methods` receives the definitions.
        stubs:  Iterable of ScriptMethodStubs. It is traversed more than
                once, so it must be re-iterable (e.g. a list or tuple).
    """
    defs = [stub.def_ for stub in stubs]
    rcbs = [stub.resolution_callback for stub in stubs]
    # `get_default_args` is handed `original_method` as-is, including None.
    defaults = [get_default_args(stub.original_method) for stub in stubs]
    concrete_type._create_methods(defs, rcbs, defaults)
def create_script_module_for_tracing(nn_module, stubs):
    """
    Creates a new ScriptModule from an nn.Module, but always uses a fresh type.

    NOTE: Only use this when we cannot guarantee type sharing will work
    correctly. This only happens today for traced modules, where the same
    module can produce different traced methods depending on the inputs.

    Arguments:
        nn_module:  The original Python nn.Module that we are creating a ScriptModule for
        stubs:  ScriptMethodStubs to compile as part of the conversion process.
    """
    check_module_initialized(nn_module)

    # The ConcreteType starts out without a JIT type; the freshly built C++
    # module below supplies one.
    fresh_concrete_type = infer_raw_concrete_type(nn_module)
    qualified_name = torch._jit_internal._qualified_name(type(nn_module))
    fresh_cpp_module = torch._C.ScriptModule(qualified_name, torch.jit._python_cu, True)

    # Poison this concrete type to ensure that it never gets re-used
    fresh_concrete_type.set_poisoned()
    fresh_concrete_type.add_jit_type(fresh_cpp_module._type())

    return create_script_module_impl(nn_module, fresh_concrete_type, fresh_cpp_module, stubs)
def create_script_module(nn_module, stubs):
    """
    Creates a new ScriptModule from an nn.Module, sharing underlying JIT types if possible

    Arguments:
        nn_module:  The original Python nn.Module that we are creating a ScriptModule for
        stubs:  ScriptMethodStubs to compile as part of the conversion process.
    """
    check_module_initialized(nn_module)
    # The shared store hands back an existing ConcreteType when one matches.
    shared_type = concrete_type_store.get_or_create_concrete_type(nn_module)
    jit_type = shared_type.jit_type
    new_cpp_module = torch._C._create_module_with_type(jit_type)
    return create_script_module_impl(nn_module, shared_type, new_cpp_module, stubs)
def create_script_module_impl(nn_module, concrete_type, cpp_module, stubs):
    """
    Convert an nn.Module to a RecursiveScriptModule.

    Arguments:
        nn_module:  The original Python nn.Module that we are creating a ScriptModule for
        concrete_type:  The fully initialized ConcreteType of the module.
        cpp_module:  A newly-constructed C++ script::Module to copy stuff into.
        stubs:  ScriptMethodStubs to compile as part of the conversion process.
    """
    assert concrete_type.jit_type and concrete_type.jit_type == cpp_module._type()

    def init_fn(script_module):
        # Populate the new ScriptModule from `nn_module` in three passes.

        # Pass 1: attributes, parameters and buffers.
        for attr_name, (attr_type, is_param) in concrete_type.get_attributes().items():
            value = getattr(nn_module, attr_name)
            if is_param:
                cpp_module._register_parameter(attr_name, value, False)
                continue
            if isinstance(value, torch.jit.Attribute):
                # Register the wrapped value rather than the Attribute wrapper.
                value = value.value
            cpp_module._register_attribute(attr_name, attr_type, value)

        # Pass 2: submodules, each recursively scripted first.
        for module_name in concrete_type.get_module_names():
            submodule = getattr(nn_module, module_name)
            assert isinstance(submodule, Module)
            scripted_submodule = recursive_script(submodule)
            cpp_module._register_module(module_name, scripted_submodule._c)
            script_module._modules[module_name] = scripted_submodule

        # Pass 3: @ignored/@unused bound methods, so they remain callable
        # from Python on the ScriptModule.
        for attr_name in dir(nn_module):
            candidate = getattr(nn_module, attr_name, None)
            if inspect.ismethod(candidate) and _jit_internal.is_ignored_fn(candidate):
                setattr(script_module, attr_name, candidate)

        # For convenience, attach the concrete type to the new ScriptModule
        script_module._concrete_type = concrete_type

    # Build the ScriptModule; `init_fn` above is passed in as its initializer.
    script_module = torch.jit.RecursiveScriptModule._construct(cpp_module, init_fn)

    # Methods are compiled only once per concrete type.
    compiled = concrete_type_store.methods_compiled
    if concrete_type not in compiled:
        create_methods_from_stubs(concrete_type, stubs)
        torch._C._run_emit_module_hook(cpp_module)
        compiled.add(concrete_type)

    # Expose the compiled methods on the Python ScriptModule object.
    for stub in stubs:
        original = stub.original_method
        if original is None:
            # define()'d methods don't have an Python original_method, so we
            # don't need to do any Python re-wrapping stuff
            continue

        method_name = original.__name__
        if method_name != stub.def_.name().name:
            # TODO: Why skip this? Because @torch.jit._overload_method will
            # mangle the name of the function.
            continue

        compiled_method = cpp_module._get_method(method_name)
        # Wrap the original to propagate docstrings and such.
        # TODO: we don't currently do this functions that are recursively
        # compiled, we should.
        wrapped_method = functools.wraps(original)(compiled_method)

        # Store directly in the instance __dict__ so this entry is found
        # first when `method_name` is looked up (as opposed to the stubs or
        # nn.Module.forward)
        script_module.__dict__[method_name] = wrapped_method

    return script_module
def get_overload_annotations(mod):
    """
    Collect the overloads registered for the callable attributes of `mod`.

    Arguments:
        mod:  The object whose attributes (from `dir(mod)`) are inspected.

    Returns:
        A dict mapping each callable attribute that has overloads to a list
        of `(mangled overload name, overload function)` pairs. The mangled
        name is the attribute name followed by "__" and the overload index.
    """
    # original function => [(mangled overload name, overload function)]
    overloads = {}
    for name in dir(mod):
        item = getattr(mod, name, None)
        if not callable(item):
            continue

        # builtin functions like repr() in python 2 do not have __module__ defined
        if not hasattr(item, "__module__") or item.__module__ is None:
            continue

        method_overloads = _jit_internal._get_overloaded_methods(item, mod.__class__)
        if method_overloads is None:
            continue

        overloads[item] = [
            (name + "__" + str(index), overload_fn)
            for index, overload_fn in enumerate(method_overloads)
        ]
    return overloads
def get_overload_name_mapping(overload_info):
    """
    Reduce overload info to the `__overloads__` format.

    Arguments:
        overload_info:  dict of original function =>
                        [(overload name, overload function)]

    Returns:
        dict of original function name => [overload names]. Functions that
        share a `__name__` have their overload names concatenated.
    """
    names_by_function = {}
    for orig_fn, overloads in overload_info.items():
        # setdefault also creates the (possibly empty) entry for a function
        # that has no overloads listed.
        collected = names_by_function.setdefault(orig_fn.__name__, [])
        collected.extend(overload_name for overload_name, _ in overloads)
    return names_by_function
def make_stubs_for_overloads(overload_info):
    """
    Build one ScriptMethodStub per overload in `overload_info`.

    Arguments:
        overload_info:  dict of original function =>
                        [(overload name, overload function)]

    Returns:
        A list of ScriptMethodStubs. Each stub's definition comes from
        `torch._C._replace_overloaded_method_decl`, called with the
        overload's declaration, the original function's definition and the
        overload name. Its resolution callback is created from the original
        function, and its `original_method` is the overload function.
    """
    self_name = "RecursiveScriptModule"
    stubs = []
    for orig_fn, overloads in overload_info.items():
        orig_def = torch.jit.get_jit_def(orig_fn, self_name=self_name)
        for overload_name, overload_fn in overloads:
            torch.jit._check_no_signature(overload_fn)
            overload_def = torch.jit.get_jit_def(overload_fn, self_name=self_name)
            merged_def = torch._C._replace_overloaded_method_decl(
                overload_def.decl(), orig_def, overload_name)
            rcb = _jit_internal.createResolutionCallbackFromClosure(orig_fn)
            stubs.append(ScriptMethodStub(rcb, merged_def, overload_fn))
    return stubs
def check_module_initialized(mod):
    """
    Verify that `mod` is an nn.Module that has a `_parameters` attribute.

    Raises:
        AssertionError: if `mod` is not a torch.nn.Module.
        RuntimeError: if `mod` has no `_parameters` attribute.
    """
    assert isinstance(mod, torch.nn.Module)
    if hasattr(mod, '_parameters'):
        return
    class_name = type(mod).__name__
    message = "'{}' has not been initialized, did you forget to call 'super()'?".format(class_name)
    raise RuntimeError(message)
def infer_methods_to_compile(nn_module):
    """
    Implements the default rules for which methods should act as starting
    points for compilation (TODO add a link when the rules are published).

    As a side effect, `nn_module.__overloads__` is replaced with a dict that
    combines its previous contents with the annotated overloads.

    Returns:
        The overload stubs followed by one stub per selected method.
    """
    check_module_initialized(nn_module)

    candidates = []
    if hasattr(nn_module, 'forward'):
        # TODO, we deleted a check that forward is actually defined, instead skipping it
        uses_base_forward = getattr(nn_module.forward, "__func__", None) == torch.nn.Module.forward
        if not uses_base_forward and not _jit_internal.is_ignored_fn(nn_module.forward):
            candidates.append('forward')

    # Every attribute carrying the EXPORT modifier is a starting point too.
    export_modifier = _jit_internal.FunctionModifiers.EXPORT
    for attr_name in dir(nn_module):
        attr = getattr(nn_module, attr_name, None)
        if _jit_internal.get_torchscript_modifier(attr) is export_modifier:
            candidates.append(attr_name)

    overload_name_mappings = dict(getattr(nn_module, "__overloads__", {}))
    overload_info = get_overload_annotations(nn_module)
    overload_name_mappings.update(get_overload_name_mapping(overload_info))
    overload_stubs = make_stubs_for_overloads(overload_info)

    nn_module.__overloads__ = overload_name_mappings

    # we shouldn't directly compile overloaded methods, just its overloads.
    # The remaining names are de-duplicated through a side set while a list
    # keeps first-seen order, so compile order stays deterministic.
    seen = set()
    selected = []
    for method_name in candidates:
        if method_name in overload_name_mappings or method_name in seen:
            continue
        seen.add(method_name)
        selected.append(method_name)

    method_stubs = [make_stub_from_method(nn_module, method_name) for method_name in selected]
    return overload_stubs + method_stubs
def recursive_script(nn_module):
    """
    Makes a ScriptModule from an nn.Module, using the default rules for
    determining which methods to compile.

    A module that already is a ScriptModule is returned as-is.
    """
    if isinstance(nn_module, torch.jit.ScriptModule):
        return nn_module

    check_module_initialized(nn_module)

    iterable_module_types = (torch.nn.ModuleList, torch.nn.Sequential, torch.nn.ModuleDict)
    if isinstance(nn_module, iterable_module_types):
        # Create constant versions for the iterable modules
        return create_constant_iterable_module(nn_module)

    stubs = infer_methods_to_compile(nn_module)
    return create_script_module(nn_module, stubs)
def try_compile_fn(fn, loc):
    """
    Script `fn` with a resolution callback built from its closure.

    Arguments:
        fn:  The object to compile.
        loc:  Not used by this function.

    Returns:
        None for @ignore'd functions and for nn.Module instances, otherwise
        the result of `torch.jit.script`.

    Raises:
        RuntimeError: if `fn` is neither a Python function nor a method.
    """
    # @ignore'd functions are left alone. Modules are callable, so pybind
    # recognizes them as functions, but nothing is done for them either.
    if _jit_internal.is_ignored_fn(fn) or isinstance(fn, torch.nn.Module):
        return None

    if not (inspect.isfunction(fn) or inspect.ismethod(fn)):
        raise RuntimeError("`{}` is not a function. Recursive scripting only supports "
                           "Python functions or methods currently.\n"
                           "Consider manually annotating `{}` with @torch.jit.script.".format(fn, fn))

    # The scope where the function was defined isn't available here, but the
    # necessary info can be extracted from the variables the function object
    # closes over.
    closure_rcb = _jit_internal.createResolutionCallbackFromClosure(fn)
    return torch.jit.script(fn, _rcb=closure_rcb)
def create_constant_iterable_module(module):
    """
    Build the constant counterpart of an nn.Sequential, nn.ModuleList or
    nn.ModuleDict, converting every submodule first.

    Raises:
        RuntimeError: if `module` is none of the three supported types.
    """
    iterable_types = (ModuleList, Sequential, ModuleDict)

    converted = collections.OrderedDict()
    for key, submodule in module._modules.items():
        if isinstance(submodule, iterable_types):
            # Make each item in the module a constant
            convert = create_constant_iterable_module
        else:
            convert = recursive_script
        converted[key] = convert(submodule)

    if isinstance(module, Sequential):
        return torch.jit._ConstSequential(Sequential(converted))
    if isinstance(module, ModuleList):
        return torch.jit._ConstModuleList(converted)
    if isinstance(module, ModuleDict):
        return torch.jit._ConstModuleDict(converted)

    raise RuntimeError("Only nn.ModuleList, nn.Sequential, and nn.ModuleDict can be made "
                       "into constant modules, found {}".format(module))
def wrap_cpp_module(cpp_module):
    """
    Wrap this torch._C.ScriptModule in a Python ScriptModule, recursively for all submodules
    """
    def init_fn(script_module):
        # Wrap each child C++ module and attach it under the same name.
        for child_name, child_cpp_module in script_module._c._get_modules():
            wrapped_child = wrap_cpp_module(child_cpp_module)
            setattr(script_module, child_name, wrapped_child)

    return torch.jit.RecursiveScriptModule._construct(cpp_module, init_fn)
def compile_unbound_method(concrete_type, fn):
    """
    Compile the function `fn` as a method on `concrete_type`.

    Returns:
        The ScriptMethodStub that was compiled, or None if `fn` is an
        ignored function (in which case nothing is compiled).
    """
    if not _jit_internal.is_ignored_fn(fn):
        method_stub = make_stub(fn)
        # Emit hooks stay disabled here because the graph that is calling
        # this function is not yet complete.
        with torch.jit._disable_emit_hooks():
            create_methods_from_stubs(concrete_type, (method_stub,))
        return method_stub
    return None
def lazy_bind(concrete_type, unbound_method):
    """
    Returns a function that lazily binds `unbound_method` to a provided
    Module IValue, then invokes the method. We do this so that any Python
    shenanigans that will poison type sharing are impossible at compile
    time.

    The returned function carries `unbound_method` as `original_fn`, takes
    over its `__name__` and has its TorchScript modifier copied onto it.
    """
    def lazy_binding_method(cpp_module, *args):
        def init_fn(script_module):
            # Copy @ignored/@unused methods from the original class to the
            # new module, so they are available during execution.
            py_class = concrete_type.py_class
            for attr_name in dir(py_class):
                attr = getattr(py_class, attr_name, None)
                if _jit_internal.is_ignored_fn(attr):
                    setattr(script_module, attr_name, attr)

            # Copy constants over so they are available during execution.
            for const_name, const_value in concrete_type.get_constants().items():
                setattr(script_module, const_name, const_value)

        wrapper = torch.jit.RecursiveScriptModule._construct(cpp_module, init_fn)
        bound = bind_method(unbound_method, wrapper, torch.jit.RecursiveScriptModule)
        return bound(*args)

    # make the lazy binding method "look like" the original method
    lazy_binding_method.original_fn = unbound_method
    lazy_binding_method.__name__ = unbound_method.__name__
    torch._jit_internal.copy_torchscript_modifier(unbound_method, lazy_binding_method)

    return lazy_binding_method