#include "torch/csrc/jit/script/init.h" #include "torch/csrc/Device.h" #include "torch/csrc/Dtype.h" #include "torch/csrc/Layout.h" #include "torch/csrc/jit/import.h" #include "torch/csrc/jit/script/compiler.h" #include "torch/csrc/jit/python_tracer.h" #include "torch/csrc/jit/pybind_utils.h" #include "torch/csrc/jit/constants.h" #include "torch/csrc/jit/passes/to_batch.h" #include "torch/csrc/jit/function_schema.h" #include "torch/csrc/jit/script/parser.h" #include #include #include #include #include #include #include #include #include namespace torch { namespace jit { namespace script { using ResolutionCallback = std::function; // The visibility attribute is to avoid a warning about storing a field in the // struct that has a different visibility (from pybind) than the struct. #ifdef _WIN32 #define VISIBILITY_HIDDEN #else #define VISIBILITY_HIDDEN __attribute__((visibility("hidden"))) #endif static std::string typeString(py::handle h) { return py::str(h.get_type().attr("__name__")); } inline std::shared_ptr toSimple(Value* v) { return std::make_shared(v); } // NB: This should be the single entry-point for instantiating a SugaredValue // from a Python object. If you are adding support for converting a new Python // type, *add it in this function's implementation*. std::shared_ptr toSugaredValue( py::object obj, Method& m, SourceRange loc, bool is_constant = false, bool is_submodule = false); struct VISIBILITY_HIDDEN PythonValue : public SugaredValue { PythonValue(py::object self) : self(std::move(self)) {} FunctionSchema getSchema(const size_t n_args, const size_t n_binders) { auto annotations = py::module::import("torch.jit.annotations"); auto signature = annotations.attr("get_signature")(self); std::vector args, rets; // We may mutate this if we can determine the number of args from Python // introspection. size_t actual_n_args = n_args; if (!signature.is_none()) { std::vector arg_types, ret_types; std::tie(arg_types, ret_types) = py::cast, std::vector>>(signature); args.reserve(arg_types.size()); size_t idx = 0; // Fake argument names by putting in the index for (auto &arg_type : arg_types) { args.push_back(Argument(std::to_string(idx++), std::move(arg_type), {}, {}, false)); } rets.reserve(ret_types.size()); idx = 0; for (auto &ret_type : ret_types) { rets.push_back(Argument(std::to_string(idx++), std::move(ret_type), {}, {}, false)); } } else { // Create a default signature using what information we have // First see if we can introspect the number of function parameters // irrespective of the presence of explicit type annotations auto num_params = annotations.attr("get_num_params")(self); if (!num_params.is_none()) { // Return a signature with the correct number of params according to the // Python function. The error handling in call() will catch any mismatch // later. actual_n_args = py::cast(num_params); } // Construct the default signature: all arguments and returns will be // DynamicType args.reserve(actual_n_args); for (size_t i=0; i < actual_n_args; ++i) { args.push_back(Argument(std::to_string(i), DynamicType::get(), {}, {}, false)); } rets.reserve(n_binders); for (size_t i = 0; i < n_binders; ++i) { rets.push_back(Argument(std::to_string(i), DynamicType::get(), {}, {}, false)); } } return FunctionSchema("", std::move(args), std::move(rets)); } // call it like a function, e.g. `outputs = this(inputs)` virtual std::shared_ptr call(SourceRange loc, Method & m, at::ArrayRef inputs_, at::ArrayRef attributes, size_t n_binders) override { auto inputs = toValues(*m.graph(), inputs_); auto schema = getSchema(inputs.size(), n_binders); std::stringstream failure_messages; at::optional> all_inputs = tryMatchSchema(schema, loc, *m.graph(), inputs_, attributes, failure_messages, /*conv_tensor_to_num*/true); if (!all_inputs) throw ErrorReport(loc) << failure_messages.str(); // Release the function object so we can wrap it in a PythonOp py::object func = self; std::string cconv(inputs.size(), 't'); Node* new_node = m.graph()->insertNode(m.graph()->createPythonOp( THPObjectPtr(func.release().ptr()), cconv, {})); new_node->setSourceLocation(std::make_shared(loc)); for(auto &i : *all_inputs) new_node->addInput(i); // This is really dumb, but relaxing the constraints on return types would // require us to change the implementation of PythonOps in the interpreter. // Note that this effectively makes the return type of Tuple[Tensor] and Tensor // equivalent, but the PythonOp impl ends with an optional tuple unpack, so we need // to do it. for (auto & ret_arg : schema.returns) { if (!ret_arg.type->isSubtypeOf(DynamicType::get())) { throw ErrorReport(loc) << "Python functions can currently only return Tensors"; } } std::vector outputs; for(size_t i = 0; i < schema.returns.size(); ++i) outputs.push_back(new_node->addOutput()); return std::make_shared(packOutputs(*m.graph(), outputs)); } virtual std::shared_ptr attr(SourceRange loc, Method & m, const std::string& field) override; virtual std::string kind() const override { std::stringstream ss; ss << "python value of type '" << typeString(self) << "'"; return ss.str(); } protected: py::object getattr(SourceRange loc, const std::string& name) { try { return py::getattr(self, name.c_str()); } catch (py::error_already_set& e) { throw ErrorReport(loc) << "object has no attribute " << name; } } py::object self; }; // A Python value respresenting a custom op namespace object, like // `torch.ops.my_namespace`. When accessing an attribute, it is assumed that it // is the function under that custom op namespace we want to call, and a // `BuiltinFunction` value is returned for it. struct VISIBILITY_HIDDEN CustomOpNamespaceValue : public PythonValue { explicit CustomOpNamespaceValue(py::object obj) : PythonValue(std::move(obj)) {} std::shared_ptr attr( SourceRange loc, Method& m, const std::string& field) override { py::object member = getattr(loc, field); const auto op_namespace = py::cast(self.attr("name")); // The symbol name is the op namespace + the op (function) name, which is // being accessed as the `field` here. auto symbol = Symbol::fromQualString(op_namespace + "::" + field); return std::make_shared( std::move(symbol), at::nullopt); } }; // The `torch.ops` value. All it does is create `CustomOpNamespaceValue` // objects when accessing attributes under it, e.g. `torch.ops.my_namespace`. struct VISIBILITY_HIDDEN CustomOpsValue : public PythonValue { explicit CustomOpsValue(py::object obj) : PythonValue(std::move(obj)) {} std::shared_ptr attr( SourceRange loc, Method& m, const std::string& field) override { py::object member = getattr(loc, field); return std::make_shared(member); } }; struct VISIBILITY_HIDDEN PythonModuleValue : public PythonValue { explicit PythonModuleValue(py::object mod) : PythonValue(mod) {} std::shared_ptr attr( SourceRange loc, Method& m, const std::string& field) override { py::object member = getattr(loc, field); return toSugaredValue(member, m, loc); } }; struct VISIBILITY_HIDDEN BuiltinPythonModuleValue : public PythonModuleValue { explicit BuiltinPythonModuleValue(py::object mod) : PythonModuleValue(mod) {} std::shared_ptr attr(SourceRange loc, Method & m, const std::string& field) override { // We support calling functions and using type/layout/device constants // on the torch builtin modules py::object member = getattr(loc, field); if (py::isinstance(member)) { return std::make_shared( Symbol::aten(field), at::nullopt); } else if (field == "ops") { return std::make_shared(member); } return toSugaredValue(member, m, loc, /*is_constant =*/true); } }; bool isBuiltinModule(py::object obj) { // XXX: these can't be static, or they will be destructed after the Python interpreter // exits and that generally sounds like a bad idea py::object torch = py::module::import("torch"); py::object functional = py::module::import("torch.nn.functional"); return obj.is(torch) || obj.is(functional); } struct VISIBILITY_HIDDEN ConstantPythonTupleValue : public PythonValue { explicit ConstantPythonTupleValue(py::object tup) : PythonValue(tup) {} std::vector> asTuple(SourceRange loc, Method& m) override { py::tuple tup = self; std::vector> result; result.reserve(tup.size()); for (size_t i = 0; i < tup.size(); ++i) { result.push_back(toSugaredValue(tup[i], m, loc, true)); } return result; } }; std::shared_ptr PythonValue::attr(SourceRange loc, Method & m, const std::string& field) { // We generally don't want to allow traversing arbitrary Python objects, but we // make an exception for traversing modules because we want to be access // torch, torch.nn.functional, and the functions they expose. py::object member = getattr(loc, field); return toSugaredValue(member, m, loc); } // defines how modules/methods behave inside the script subset. // for now this does not have any interaction with python. // in the future, we will add the ability to resolve `self.foo` to python // {functions, modules, contants} so this SugaredValue is defined here // anticipating we will eventually need to replace Module with a py::object // holding the actual nn.Module class. // defines how a method obtained from a module behaves in script struct MethodValue : public SugaredValue { MethodValue(std::shared_ptr module, Method& method) : module(std::move(module)) //insurance that method stays alive , method(method) {} std::string kind() const override { return "method"; } virtual std::shared_ptr call(SourceRange loc, Method & caller, at::ArrayRef inputs, at::ArrayRef attributes, size_t n_binders) override { return std::make_shared(packOutputs(*caller.graph(), caller.emit_call_to(loc, method, inputs, attributes))); } private: std::shared_ptr module; Method& method; }; struct ModuleValue : public SugaredValue { ModuleValue(std::shared_ptr module) : module(std::move(module)) {} virtual std::string kind() const override { return "module"; } // select an attribute on it, e.g. `this.field` virtual std::shared_ptr attr(SourceRange loc, Method & m, const std::string& field) override { if(NamedModule* v = module->find_module(field)) { return std::make_shared(v->module); } else if(Method* v = module->find_method(field)) { return std::make_shared(module, *v); } else if(NamedParameter* v = module->find_parameter(field)) { return std::make_shared(m.get_or_add_parameter(v->slot())); } // This can also be a call to a non-script module, or a plain // python method. If so return this as a python value. py::object py_module = py::cast(module); if(py::object attr = py::getattr(py_module, field.c_str(), py::none())) { if (py::isinstance(attr) || py::isinstance(attr, py::module::import("torch.nn").attr("Module")) || py_module.attr("_constants_set").contains(field.c_str())) { return toSugaredValue(attr, m, loc, true); } else { throw ErrorReport(loc) << "attribute '" << field << "' of type '" << typeString(attr) << "' is not usable in a script method (did you forget to add it __constants__?)"; } } throw ErrorReport(loc) << "module has no attribute '" << field << "'"; } // call module.forward virtual std::shared_ptr call(SourceRange loc, Method & caller, at::ArrayRef inputs, at::ArrayRef attributes, size_t n_binders) override { return attr(loc, caller, "forward")->call(loc, caller, inputs, attributes, n_binders); } virtual std::vector> asTuple(SourceRange loc, Method& m) override { py::object py_module = py::cast(module); if(!py::isinstance(py_module, py::module::import("torch.jit").attr("_ConstModuleList"))) return SugaredValue::asTuple(loc, m); std::vector> result; for(py::handle module : py_module) { py::object obj = py::reinterpret_borrow(module); result.push_back(toSugaredValue( obj, m, loc, /*is_constant =*/false, /*is_submodule =*/true)); } return result; } private: std::shared_ptr module; }; std::shared_ptr toSugaredValue( py::object obj, Method& m, SourceRange loc, bool is_constant, bool is_submodule) { // directly create SimpleValues when possible, because they are first-class // and can be re-assigned. Otherwise, this would be invalid: // f = python_constant // while ... // f = f + 1 auto& g = *m.graph(); if (is_constant) { if (py::isinstance(obj)) { return toSimple(g.insertConstant(py::cast(obj), loc)); } else if (py::isinstance(obj)) { return toSimple(g.insertConstant(py::cast(obj), loc)); } else if (py::isinstance(obj)) { return toSimple(g.insertConstant(py::cast(obj), loc)); } else if (THPDevice_Check(obj.ptr())) { auto device = (THPDevice*)obj.ptr(); std::vector v = {static_cast(device->device.type()), device->device.index()}; return toSimple(g.insertConstant(std::move(v))); } else if (THPLayout_Check(obj.ptr())) { auto layout = (THPLayout*)obj.ptr(); const auto v = static_cast(layout->layout); return toSimple(g.insertConstant(v, loc)); } else if (THPDtype_Check(obj.ptr())) { auto dtype = (THPDtype*)(obj.ptr()); const auto v = static_cast(dtype->scalar_type); return toSimple(g.insertConstant(v, loc)); } else if (py::isinstance(obj)) { return std::make_shared(obj); } } if (py::isinstance(obj)) { auto mod = py::cast>(obj); // In the case that this Python object is not a submodule, inline *ONLY // PURE* ScriptModules. This allows us to call arbitrary @script functions // within a scripting context while still enforcing that parameters from // stateful submodules are properly accounted for. if (!is_submodule && mod->get_parameters().size() != 0) { throw ErrorReport() << "Attempted to inline a Module with parameters. " "Stateful modules to be inlined must be submodules of the callee."; } return std::make_shared(mod); } else if (py::isinstance(obj)) { if (isBuiltinModule(obj)) { return std::make_shared(obj); } else { return std::make_shared(obj); } } return std::make_shared(obj); } py::object unpackVariableTensorList(std::vector outputs) { // if we don't tell pybind these are variables it chokes on the // conversion. // TODO: fix conversions to be sane and make sure this works. if (outputs.size() == 0) { return py::none(); } else if (outputs.size() == 1) { return py::cast(autograd::as_variable_ref(outputs[0])); } else { py::tuple tuple(outputs.size()); for(size_t i = 0; i < outputs.size(); i++) { tuple[i] = py::cast(autograd::as_variable_ref(outputs[i])); } return tuple; } } static void gatherParametersAndBuffers(std::vector & values, const Module & m) { for(auto & param : m.get_parameters()) { values.push_back(param->slot()); } for(const auto & sub : m.get_modules()) { gatherParametersAndBuffers(values, *sub->module); } } Resolver pythonResolver(ResolutionCallback rcb) { return [=](const std::string& name, Method& m, const SourceRange& loc) -> std::shared_ptr { AutoGIL ag; py::object obj = rcb(name); if (obj.is(py::none())) { return nullptr; } return toSugaredValue(obj, m, loc); }; } void initJitScriptBindings(PyObject* module) { auto m = py::handle(module).cast(); // torch.jit.ScriptModule is a subclass of this C++ object. // Methods here are prefixed with _ since they should not be // public. py::class_>(m, "ScriptModule") .def(py::init<>()) .def("save", &Module::save) .def("_load", [](const std::shared_ptr module, const std::string& filename) { ImportIRModule(module, filename); }) .def("_set_optimized", &Module::set_optimized) .def( "_define", [](std::shared_ptr m, const std::string& script, ResolutionCallback rcb, bool has_self) { auto self = has_self ? std::make_shared(m) : nullptr; return defineMethodsInModule(*m, script, pythonResolver(rcb), self); }) .def("_create_methods", [](std::shared_ptr m, const std::vector& defs, const std::vector& rcbs) { std::vector resolvers; for(auto & callback : rcbs) { resolvers.push_back(pythonResolver(callback)); } defineMethodsInModule( *m, defs, resolvers, std::make_shared(m)); }) .def("_get_method", [](Module& self, const std::string& name) -> const Method& { return self.get_method(name); }, py::return_value_policy::reference_internal) .def("_register_parameter", &Module::register_parameter) .def("_register_module", &Module::register_module) .def("_set_parameter", &Module::set_parameter) .def("_get_parameter", &Module::get_parameter) .def("_get_module", &Module::get_module) .def("_get_modules", [](Module& self) -> py::tuple { auto & modules = self.get_modules(); py::tuple result(modules.size()); for(size_t i = 0; i < modules.size(); ++i) { auto & item = modules[i]; result[i] = std::make_pair(item.key, item.value); } return result; }) .def("_get_parameters", [](Module& self) -> py::tuple { auto & parameters = self.get_parameters(); py::tuple result(parameters.size()); for(size_t i = 0; i < parameters.size(); ++i) { auto & p = parameters[i]; py::tuple r(3); result[i] = std::make_tuple( p.key, autograd::as_variable_ref(*p->slot()), p->is_buffer); } return result; }) .def("_has_parameter", [](Module& self, const std::string& name) { if(auto r = self.find_parameter(name)) { return !r->is_buffer; } return false; }) .def("_has_buffer", [](Module& self, const std::string& name) { if(auto r = self.find_parameter(name)) { return r->is_buffer; } return false; }) .def("_has_module", [](Module& self, const std::string& name) { return bool(self.find_module(name)); }) .def("_has_method", [](Module& self, const std::string& name) { return bool(self.find_method(name)); }) .def("_method_names", [](Module& self) { using Item = torch::detail::OrderedDict>::Item; return fmap(self.get_methods(), [](const Item & item) { return (*item)->name(); }); }) .def("_create_method_from_graph", []( Module& self, const std::string& name, std::shared_ptr graph ){ std::vector parameters; self.create_method(name, std::move(graph), std::move(parameters)); }) .def("_create_method_from_trace", []( Module& self, const std::string& name, py::function func, py::tuple input_tuple) { // prereq: Module's buffers and parameters are unique // this was ensured in python before calling this function std::vector parameters; gatherParametersAndBuffers(parameters, self); Stack inputs = toStack(input_tuple); for(at::Tensor* param : parameters) { inputs.emplace_back(*param); } auto graph = tracer::createGraphByTracing(func, inputs, input_tuple.size()); self.create_method(name, std::move(graph), std::move(parameters)); }) .def("graph_for", [](Module& self, py::args args, py::kwargs kwargs) { if (self.find_method("forward")) { Method & m = self.get_method("forward"); return m.graph_for( createStackForSchema(m.getSchema(), std::move(args), std::move(kwargs))); } throw std::runtime_error("Attempted to call graph_for on a Module without a compiled forward()"); }) .def("get_debug_state", [](Module& self) { if (self.find_method("forward")) { Method & m = self.get_method("forward"); return m.getDebugState(); } throw std::runtime_error("Attempted to call get_debug_state on a Module without a compiled forward()"); }) .def("forward", [](Module& self, py::args args, py::kwargs kwargs) { // We implement this in C++ to avoid incurring the pybind11 dispatch // overhead twice: once to call into the method lookup for "forward" // and once to actually invoke the method. // // There is a thin wrapper on top of this method in the C++ version of // ScriptModule. return invokeScriptMethodFromPython(self.get_method("forward"), std::move(args), std::move(kwargs)); }); py::class_(m, "ScriptMethod", py::dynamic_attr()) .def("graph", [&](Method& self) { return self.graph(); }) .def("__call__", invokeScriptMethodFromPython) .def_property_readonly("graph", [](Method& m) { return m.graph(); }) .def("propagate_shapes", &Method::propagate_shapes) .def("propagate_and_assign_input_and_output_shapes", &Method::propagate_and_assign_input_and_output_shapes) .def("params", &Method::params) .def("graph_for", [](Method& self, py::args args, py::kwargs kwargs) { return self.graph_for(createStackForSchema(self.getSchema(), std::move(args), std::move(kwargs))); }) .def("forward_schema", [](Method &self, Def &def, bool is_method) { auto schema = extractSchemaFromDef(def, is_method); self.setSchema(schema); }) .def("pretty_print_schema", &Method::pretty_print_schema); m.def("_jit_script_compile", [](const Def &def, ResolutionCallback rcb) { return compileFunction(def, pythonResolver(rcb)); }); m.def("parse_type_comment", [](const std::string& comment) { Parser p(comment); return Decl(p.parseTypeComment(true)); }); m.def("merge_type_from_type_comment", &mergeTypesFromTypeComment); } } // namespace script } // namespace jit } // namespace torch