#include <torch/csrc/jit/tracer.h>
#include <c10/util/Exception.h>
#include <torch/csrc/autograd/engine.h>
#include <torch/csrc/autograd/function.h>
#include <torch/csrc/autograd/variable.h>
#include <torch/csrc/jit/passes/dead_code_elimination.h>
#include <torch/csrc/jit/passes/remove_expands.h>
#include <memory>
#include <sstream>
#include <string>
namespace torch {
namespace jit {
namespace tracer {
////////////////////////////////////////////////////////////////////////////////
// Recording the traces
////////////////////////////////////////////////////////////////////////////////
namespace detail {
template <typename T>
void genericAddInput(Node* n, T value) {
Value* v = n->owningGraph()->insertConstant(value);
recordSourceLocation(v->node());
n->addInput(v);
}
template <typename T>
void badArgType(const T& v) {
AT_ERROR(
"Found an unsupported argument type in the JIT tracer: ",
c10::demangle_type<T>(),
". File a bug report.");
}
thread_local std::shared_ptr<TracingState> tracing_state;
} // namespace detail
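// Temporarily suspend tracing on the current thread. The returned callback
// restores the saved state, so callers can bracket code that must not be
// recorded, e.g. (illustrative sketch, not code from this file):
//
//   auto resume = tracer::pauseTracing();
//   ... run work that should not appear in the trace ...
//   resume();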
TORCH_API std::function<void()> pauseTracing() {
// NOLINTNEXTLINE
std::shared_ptr<tracer::TracingState> state = getTracingState();
tracer::setTracingState(nullptr);
return [state]() { tracer::setTracingState(state); };
}
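// Remove every record of 'var' from the tracing environment, scanning all
// frames of the environment stack so that stale mappings are not returned by
// later getValueTrace lookups.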
void delValueTrace(const Variable& var) {
AT_ASSERT(var.defined());
auto& env_stack = getTracingState()->env_stack;
for (size_t i = 0; i < env_stack.size(); ++i) {
auto& value_map = env_stack.at(env_stack.size() - 1 - i).value_map;
auto it = value_map.find(var);
if (it == value_map.end()) {
continue;
}
value_map.erase(it);
}
}
// Given a variable 'var', return the 'node' which represents the instruction
// which computes the value of this variable in the IR.
// Here, we interpret untraced variables as constants that are just embedded
// in the graph. This is useful to handle code which does things like this
// (from torch.autograd.variable, now moved to C++):
//
// def mm(self, matrix):
// output = Variable(self.data.new(self.data.size(0), matrix.data.size(1)))
// return Addmm.apply(output, self, matrix, 0, 1, True)
//
// Here, mm fakes up a dummy variable with uninitialized data to do an inplace
// update on, but subsequently ignores it because the alpha scaling factor is
// zero. This is one of the cases where a Variable can be created inside of a
// trace, and if we treat it as a constant, everything will work out.
Value* getValueTrace(const IValue& var) {
auto& state = getTracingState();
auto& env_stack = state->env_stack;
if (var.isTensor()) {
auto ten = var.toTensor();
if (!ten.defined()) {
Node* n = state->graph->createUndefined();
return state->graph->insertNode(n)->output();
}
for (size_t i = 0; i < env_stack.size(); ++i) {
auto& value_map = env_stack.at(env_stack.size() - 1 - i).value_map;
auto it = value_map.find(ten);
if (it == value_map.end()) {
continue;
}
if (!it->second->hasUniqueName()) {
auto unique_name = state->lookup_var_name_fn(ten);
if (!unique_name.empty()) {
it->second->setUniqueName(unique_name);
}
}
return it->second;
}
// Didn't find it. Bake in a constant
Value* constant = state->graph->insertConstant(ten);
recordSourceLocation(constant->node());
constant->inferTypeFrom(ten);
auto it = env_stack.back().value_map.find(ten);
it = env_stack.back().value_map.emplace_hint(it, ten, constant);
return it->second;
} else if (var.isFuture()) {
auto fut = var.toFuture();
for (size_t i = 0; i < env_stack.size(); ++i) {
auto& future_map = env_stack.at(env_stack.size() - 1 - i).future_map;
auto it = future_map.find(fut);
if (it == future_map.end()) {
continue;
}
return it->second;
}
std::ostringstream oss;
oss << "Tried to trace Future that the tracer was not aware of.";
throw std::runtime_error(oss.str());
} else {
std::ostringstream oss;
oss << "Unknown type used in value trace lookup!";
throw std::runtime_error(oss.str());
}
}
// Allow tracing of tuples passed to List[Tensor] or Tuple[Tensor...] arguments.
// getValueTrace and getNestedValueTrace could be merged once it is verified
// that taking an IValue instead of a Variable is OK.
Value* getNestedValueTrace(const IValue& v) {
auto& state = getTracingState();
if (v.isTensorList()) {
return state->graph
->insertNode(state->graph->createList(
DynamicType::get(),
fmap(
v.toTensorListRef(),
[](const IValue& val) { return getNestedValueTrace(val); })))
->output();
} else if (v.isTuple()) {
return state->graph
->insertNode(state->graph->createTuple(fmap(
v.toTuple()->elements(),
[](const IValue& val) { return getNestedValueTrace(val); })))
->output();
}
return getValueTrace(v.toTensor());
}
Value* getOutputTrace(
const std::shared_ptr<TracingState>& state,
const Variable& var) {
if (!var.defined()) {
Node* n = state->graph->createUndefined();
return state->graph->insertNode(n)->output();
}
auto& value_map = state->env_stack.back().value_map;
auto it = value_map.find(var);
if (it == value_map.end()) {
std::ostringstream os;
os << "output of traced region did not have observable "
<< "data dependence with trace inputs; this probably indicates your program "
<< "cannot be understood by the tracer.";
throw std::runtime_error(os.str());
}
return it->second;
}
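// Recursively resolve an output IValue: tensors map directly to their traced
// Value, while tuples are rebuilt by inserting a tuple construction node whose
// elements are resolved the same way. Anything else is rejected.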
Value* getNestedOutputTrace(
const std::shared_ptr<TracingState>& state,
const IValue& iv) {
if (iv.isTensor()) {
return getOutputTrace(state, iv.toTensor());
} else if (iv.isTuple()) {
const auto& elems = iv.toTuple()->elements();
auto tuple_node = state->graph->createTuple(
fmap(elems, [&state](const IValue& iv) {
return getNestedOutputTrace(state, iv);
}));
state->graph->insertNode(tuple_node);
return tuple_node->output();
} else {
AT_ERROR(
"Only tensors or tuples of tensors can be output from traced functions");
}
}
// Start tracing, treating 'inputs' as inputs to the trace, which can be
// varied on subsequent invocations of the trace. Any other variables
// will be treated as constants.
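//
// A typical tracing session looks roughly like this (illustrative sketch):
//
//   Stack stack = ...;                      // trace inputs
//   auto result = tracer::enter(stack);     // tracing state + proxy inputs
//   ... run the traced computation on result.second ...
//   tracer::exit(outputs);                  // register outputs, stop tracing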
std::pair<std::shared_ptr<TracingState>, Stack> enter(Stack inputs) {
if (isTracing()) {
AT_ERROR("Tracing can't be nested");
}
auto state = std::make_shared<TracingState>();
setTracingState(state);
// XXX: this function mutates its input
const std::function<IValue(IValue, TypePtr, Value*)> add_input =
[&](IValue input, TypePtr type, Value* value) -> IValue {
value->setType(type);
if (type->isSubtypeOf(DynamicType::get())) {
auto input_tensor = input.toTensor();
auto name = Variable(input_tensor).name();
auto& value_map = state->env_stack.back().value_map;
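// If the same tensor object is passed as more than one trace input, alias it
// through a no-op view so that each graph input gets its own value_map entry.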
if (value_map.find(input_tensor) != value_map.end()) {
input_tensor = input_tensor.view(input_tensor.sizes());
}
value->setUniqueName(name);
value_map[input_tensor] = value;
return input_tensor;
} else if (auto tuple_type = type->cast<TupleType>()) {
auto unpack_node =
state->graph->insertNode(state->graph->createTupleUnpack(value));
auto elem_values = unpack_node->outputs();
auto elem_types = tuple_type->elements();
Stack elems = input.toTuple()->elements();
size_t num_elems = elems.size();
AT_ASSERT(
elem_values.size() == num_elems && elem_types.size() == num_elems);
for (size_t i = 0; i < num_elems; ++i) {
elems[i] = add_input(elems[i], elem_types[i], elem_values[i]);
}
return Tuple::create(std::move(elems));
} else {
AT_ERROR(
"Only tensors or tuples of tensors can be inputs to traced functions");
}
};
for (IValue& input : inputs) {
input = add_input(
input, incompleteInferTypeFrom(input), state->graph->addInput());
}
return std::make_pair(state, inputs);
}
// Exit a trace, treating 'outputs' as the outputs of the trace. These
// are the variables whose values will be computed upon subsequent
// invocations of the trace.
void exit(const Stack& outputs) {
auto& state = getTracingState();
for (auto& output : outputs) {
state->graph->registerOutput(getNestedOutputTrace(state, output));
}
setTracingState(nullptr);
}
// Abort tracing. Used to reset the state in case of errors.
void abandon() {
setTracingState(nullptr);
}
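// Associate an IValue with the graph Value that computes it. Containers
// (tensor lists, tuples, generic lists) are handled by inserting the matching
// unpack node and recursing on the elements; futures get their own map.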
void setValueTrace(const IValue& v, Value* value) {
if (v.isTensor()) {
auto var = v.toTensor();
AT_ASSERT(var.defined());
getTracingState()->env_stack.back().value_map[var] = value;
} else if (v.isTensorList()) {
auto& outputs = v.toTensorList()->elements();
auto graph = getTracingState()->graph;
Node* unpack_node =
graph->insertNode(graph->createListUnpack(value, outputs.size()));
for (size_t i = 0; i < outputs.size(); ++i) {
setValueTrace(outputs[i], unpack_node->outputs()[i]);
}
} else if (v.isTuple()) {
auto& outputs = v.toTuple()->elements();
auto graph = getTracingState()->graph;
Node* unpack_node = graph->insertNode(graph->createTupleUnpack(value));
for (size_t i = 0; i < outputs.size(); ++i) {
setValueTrace(outputs[i], unpack_node->outputs()[i]);
}
} else if (v.isGenericList()) {
auto elements = v.toGenericListRef();
auto graph = getTracingState()->graph;
Node* unpack_node =
graph->insertNode(graph->createListUnpack(value, elements.size()));
for (size_t i = 0; i < elements.size(); ++i) {
setValueTrace(elements[i], unpack_node->outputs()[i]);
}
} else if (v.isFuture()) {
auto fut = v.toFuture();
getTracingState()->env_stack.back().future_map[fut] = value;
} else {
std::ostringstream os;
os << "Tracer cannot set value trace for type " << v.tagKind() << ". "
<< "Supported types are tensor, tensor list, and tuple of tensors.";
throw std::runtime_error(os.str());
}
}
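// The addInputs overloads below record the arguments of a traced operation as
// inputs of its Node. Non-tensor arguments are baked in as constants unless a
// dynamic Value for them was stashed beforehand (see the ArgumentStash section
// below).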
void addInputs(Node* n, const char* name, int64_t value) {
using ArgumentStash = jit::tracer::ArgumentStash;
if (ArgumentStash::hasValue(name)) {
Value* v = ArgumentStash::popValue(name);
n->addInput(v);
} else {
detail::genericAddInput(n, value);
}
}
void addInputs(Node* n, const char* name, c10::optional<int64_t> value) {
if (value) {
detail::genericAddInput(n, *value);
} else {
Graph* g = n->owningGraph();
Value* none = g->insertNode(g->createNone(IntType::get()))->output();
n->addInput(none);
}
}
void addInputs(Node* n, const char* name, bool value) {
detail::genericAddInput(n, value);
}
void addInputs(Node* n, const char* name, double value) {
detail::genericAddInput(n, value);
}
void addInputs(Node* n, const char* name, const at::Scalar& value) {
detail::genericAddInput(n, value);
}
void addInputs(
Node* n,
const char* name,
const c10::optional<at::Scalar>& value) {
if (value) {
detail::genericAddInput(n, *value);
} else {
Graph* g = n->owningGraph();
Value* none = g->insertNode(g->createNone(NumberType::get()))->output();
n->addInput(none);
}
}
void addInputs(Node* n, const char* name, const std::string& value) {
detail::genericAddInput(n, value);
}
void addInputs(Node* n, const char* name, const at::Tensor& value) {
n->addInput(getValueTrace(value));
}
void addInputs(Node* n, const char* name, const at::SparseTensorRef& value) {
detail::badArgType(value);
}
void addInputs(Node* n, const char* name, at::Generator* value) {
if (value) {
detail::badArgType(value);
}
Graph* g = n->owningGraph();
Value* undef_gen =
g->insertNode(g->createNone(GeneratorType::get()))->output();
n->addInput(undef_gen);
}
void addInputs(Node* n, const char* name, at::Device value) {
detail::genericAddInput(n, value);
}
void addInputs(Node* n, const char* name, at::Layout value) {
detail::genericAddInput(n, static_cast<int64_t>(value));
}
void addInputs(Node* n, const char* name, at::ScalarType value) {
detail::genericAddInput(n, static_cast<int64_t>(value));
}
void addInputs(
Node* n,
const char* name,
const c10::optional<at::ScalarType>& value) {
if (value) {
detail::genericAddInput(n, static_cast<int64_t>(*value));
} else {
Graph* g = n->owningGraph();
Value* none = g->insertNode(g->createNone(IntType::get()))->output();
n->addInput(none);
}
}
void addInputs(Node* n, const char* name, at::TensorList value) {
Graph* g = n->owningGraph();
Node* list_node = g->insertNode(
g->createList(DynamicType::get(), fmap(value, getValueTrace)));
n->addInput(list_node->output());
}
void addInputs(Node* n, const char* name, const at::TensorOptions& options) {
// [TensorOptions in script] - update this when you change how we schematize
// TensorOptions
addInputs(n, name, at::typeMetaToScalarType(options.dtype()));
addInputs(n, name, options.layout());
addInputs(n, name, options.device());
}
void addInputs(Node* n, const char* name, at::IntList value) {
using ArgumentStash = jit::tracer::ArgumentStash;
std::vector<Value*> info = ArgumentStash::hasIntList(name)
? ArgumentStash::popIntList(name)
: ArgumentStash::IntListTrace(value.size());
auto& g = getTracingState()->graph;
for (size_t i = 0; i < info.size(); ++i) {
if (info[i] != nullptr)
continue;
info[i] = g->insertConstant(value[i]);
recordSourceLocation(info[i]->node());
}
for (jit::Value* v : info) {
if (*v->type() != *jit::IntType::get()) {
throw std::runtime_error(
"Type mismatch in setposattr for IntList. Check that your program "
"is valid without tracing, and please file a bug report if it is.");
}
}
n->addInput(
g->insertNode(g->createList(jit::IntType::get(), info))->output());
}
void addInputs(Node* n, const char* name, const ArrayRef<double>& value) {
AT_ERROR("Tracing float lists currently not supported!");
}
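// Register the outputs of a traced operation: the Value's type is inferred
// from the concrete tensor and the (tensor, Value) pair is recorded so that
// later operations consuming the tensor can find its trace.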
void addOutput(Node* node, const at::Tensor& output) {
setOutput(node->addOutput(), output);
}
void setOutput(Value* value, const at::Tensor& output) {
if (output.defined()) {
value->inferTypeFrom(output);
setValueTrace(autograd::as_variable_ref(output), value);
}
}
void addOutput(Node* node, const std::vector<at::Tensor>& outputs) {
Value* value = node->addOutput()->setType(ListType::ofTensors());
Graph* graph = node->owningGraph();
Node* unpack_node = graph->insertNode(
graph->create(prim::ListUnpack, {value}, outputs.size()));
for (size_t i = 0; i < outputs.size(); ++i) {
Value* output_val = unpack_node->outputs()[i];
output_val->inferTypeFrom(outputs[i]);
setValueTrace(outputs[i], output_val);
}
}
const std::shared_ptr<TracingState>& getTracingState() {
return detail::tracing_state;
}
void setTracingState(std::shared_ptr<TracingState> state) {
detail::tracing_state = std::move(state);
}
TracingState::TracingState()
: env_stack{TracingEnvironmentFrame()}, graph(new Graph()) {}
TracingState::~TracingState() = default;
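// Record a call to aten::size in the graph and return a Variable holding the
// concrete size, whose trace points at that node. This keeps shape-dependent
// computations symbolic instead of baking the current size in as a constant.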
autograd::Variable getSizeOf(const autograd::Variable& var, int64_t dim) {
auto& tracing_state = getTracingState();
auto& graph = tracing_state->graph;
auto size_var =
autograd::make_variable(scalar_to_tensor(at::Scalar(var.size(dim))));
auto* value = getValueTrace(var);
auto dim_val = graph->insertConstant(dim);
recordSourceLocation(dim_val->node());
auto* node = graph->insertNode(graph->create(aten::size, {value, dim_val}));
recordSourceLocation(node);
node->output()->setType(jit::IntType::get());
auto ten =
graph->insertNode(graph->createNumToTensor(node->output()))->output();
setValueTrace(size_var, ten);
return size_var;
}
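// Warn when an in-place operation is traced on a tensor whose storage is
// shared with other live tensors, since converting it to an out-of-place op
// would not update those aliases in the trace.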
void ensureUniqueIfOutOfPlaced(
const char* name,
const at::Tensor& tensor) {
auto& state = getTracingState();
if (state && !state->force_outplace) {
// If we're not converting in-place ops to out-of-place, this check is
// unnecessary
return;
}
auto aliases = tensor.storage().use_count();
if (isTracing() && aliases > 1) {
std::stringstream ss;
ss << "There are " << aliases
<< " live references to the data region being modified when tracing in-place operator "
<< name
<< ". This might cause the trace to be incorrect, because all other views "
<< "that also reference this data will not not reflect this change in the trace! "
<< "On the other hand, if all other views use the same memory chunk, but are disjoint (e.g. "
<< "are outputs of torch.split), this might still be safe.";
warn(ss.str().c_str());
}
}
////////////////////////////////////////////////////////////////////////////////
// Argument stash
////////////////////////////////////////////////////////////////////////////////
thread_local ArgumentStash ArgumentStash::stash;
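// The ArgumentStash lets callers pre-register dynamic Values for scalar and
// int-list arguments (e.g. sizes computed from tensor shapes) before the
// operation itself is traced; addInputs then wires those Values in instead of
// embedding the concrete numbers as constants.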
void ArgumentStash::stashIntListElem(
const std::string& arg_name,
size_t size,
size_t idx,
const Variable& var) {
// TODO: check type?
if (!isTracing())
return;
auto& list_trace = stash.intlists.emplace(arg_name, size).first->second;
AT_ASSERT(size == list_trace.size());
AT_ASSERT(idx < list_trace.size());
AT_ASSERT(list_trace[idx] == nullptr);
Value* ten = getValueTrace(var);
auto& g = *ten->owningGraph();
WithInsertPoint guard(ten->node()->next());
auto prim = g.insert(prim::Int, {ten});
list_trace[idx] = prim;
}
void ArgumentStash::stashValue(
const std::string& arg_name,
size_t idx,
const Variable& var,
const TypePtr& type) {
if (!isTracing())
return;
Value* ten = getValueTrace(var);
WithInsertPoint guard(ten->node()->next());
auto& g = *ten->owningGraph();
if (type == IntType::get()) {
ten = g.insert(prim::Int, {ten});
} else if (type == FloatType::get()) {
ten = g.insert(prim::Float, {ten});
}
stash.values.emplace(arg_name, ten);
}
////////////////////////////////////////////////////////////////////////////////
// Stack trace recording
////////////////////////////////////////////////////////////////////////////////
// When no Python frontend is present, we simply do not record source information.
void defaultRecordSourceLocation(Node* n) {}
std::atomic<decltype(&defaultRecordSourceLocation)> record_source_location(
defaultRecordSourceLocation);
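// recordSourceLocation dispatches through the atomic hook above; a frontend
// (e.g. the Python bindings) can install its own recorder with
// setRecordSourceLocation.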
void recordSourceLocation(Node* n) {
return record_source_location.load()(n);
}
void setRecordSourceLocation(void (*v)(Node*)) {
record_source_location.store(v);
}
void defaultWarn(const std::string& str) {
AT_WARN(str);
}
std::atomic<warn_fn_type> warn_callback{defaultWarn};
const char* WARN_PYTHON_DATAFLOW =
" might cause the trace to be incorrect. We can't record the data flow of "
"Python values, so this value will be treated as a constant in the future. "
"This means that the trace might not generalize to other inputs!";
const char* WARN_CONSTRUCTOR =
" results are registered as constants in the trace. You can safely ignore this "
"warning if you use this function to create tensors out of constant variables "
"that would be the same every time you call this function. In any other case, "
"this might cause the trace to be incorrect.";
const char* WARN_RESIZE =
" can't be represented in the JIT at the moment, so we won't connect any uses of "
"this value with its current trace. If you happen to use it again, it will show "
"up as a constant in the graph.";
// XXX: _kind may be nullptr
void _do_warn(const char* _reason, const char* _kind) {
std::string reason{_reason};
std::string kind{_kind ? _kind : ""};
std::ostringstream s;
s << reason << kind;
warn_callback.load()(s.str());
}
void setWarn(warn_fn_type fn) {
warn_callback.store(fn);
}
} // namespace tracer
} // namespace jit
} // namespace torch