[jit] make clone work for interface type (#42121)

Summary:
Pull Request resolved: https://github.com/pytorch/pytorch/pull/42121

This PR changes the Module API to allow registering a module with a
module interface type, and therefore allows Module::clone to work in
the case where a module interface type is shared by two submodules.

The interface type is shared with the newly cloned instance in the same
compilation unit because it only contains a list of FunctionSchemas
and, unlike a ClassType, does not carry any attributes.
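
A minimal sketch of the pattern this enables, condensed from the C++
test added in this PR (setup of the compilation unit `cu` and of the
two submodules is omitted):

    // subMod1 and subMod2 both implement __torch__.OneInterface
    parentMod.register_attribute(
        "subMod1", cu->get_interface("__torch__.OneInterface"), subMod1._ivalue());
    parentMod.register_attribute(
        "subMod2", cu->get_interface("__torch__.OneInterface"), subMod2._ivalue());
    // before this change, clone() could not handle the shared interface type
    Module clonedMod = parentMod.clone();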

fixes https://github.com/pytorch/pytorch/issues/41882

Test Plan: Imported from OSS

Reviewed By: suo

Differential Revision: D22781205

Pulled By: wanchaol

fbshipit-source-id: f97f4b75970f0b434e38b5a1f778eda2c4e5109b
Commit a9e7e787f8 (parent 352e15f1a2)
Author: Wanchao Liang, 2020-07-31 10:21:43 -07:00, committed by Facebook GitHub Bot
5 changed files with 185 additions and 5 deletions

@@ -1,10 +1,47 @@
 #include <test/cpp/jit/test_base.h>
 #include <test/cpp/jit/test_utils.h>
 
+#include <ATen/core/qualified_name.h>
+#include <torch/csrc/jit/frontend/resolver.h>
+#include <torch/csrc/jit/serialization/import.h>
+#include <torch/csrc/jit/serialization/import_source.h>
 #include <torch/torch.h>
 
 namespace torch {
 namespace jit {
 
+static const auto moduleInterfaceSrc = R"JIT(
+class OneInterface(ModuleInterface):
+    def one(self, x: Tensor, y: Tensor) -> Tensor:
+        pass
+)JIT";
+
+static const std::vector<std::string> subModuleMethodsSrc = {R"JIT(
+def one(self, x: Tensor, y: Tensor) -> Tensor:
+    return self.attr * x + y + 1
+
+def forward(self, x: Tensor) -> Tensor:
+    return self.attr + x
+)JIT"};
+
+static const auto parentForward = R"JIT(
+def forward(self, x: Tensor) -> Tensor:
+    return self.subMod1.one(x, x) + self.subMod2.one(x, x)
+)JIT";
+
+static void import_libs(
+    std::shared_ptr<CompilationUnit> cu,
+    const std::string& class_name,
+    const std::shared_ptr<Source>& src,
+    const std::vector<at::IValue>& tensor_table) {
+  SourceImporter si(
+      cu,
+      &tensor_table,
+      [&](const std::string& name) -> std::shared_ptr<Source> { return src; },
+      /*version=*/2);
+  si.loadType(QualifiedName(class_name));
+}
+
 void testModuleClone() {
   auto cu = std::make_shared<CompilationUnit>();
   // creating child module
@@ -34,6 +71,50 @@ void testModuleClone() {
   ASSERT_EQ(Module(p2.attr("c2").toObject()).attr(attr_name).toInt(), 3);
 }
 
+void testModuleCloneWithModuleInterface() {
+  auto cu = std::make_shared<CompilationUnit>();
+
+  // define an initial module with two submodules sharing the same interface
+  Module parentMod("parentMod", cu);
+  Module subMod1("subMod1", cu);
+  Module subMod2("subMod2", cu);
+
+  std::vector<at::IValue> constantTable;
+  import_libs(
+      cu,
+      "__torch__.OneInterface",
+      std::make_shared<Source>(moduleInterfaceSrc),
+      constantTable);
+
+  auto v1 = IValue(2);
+  subMod1.register_attribute("attr", IntType::get(), v1, false);
+
+  auto v2 = IValue(4);
+  subMod2.register_attribute("attr", IntType::get(), v2, false);
+
+  for (const std::string& method : subModuleMethodsSrc) {
+    subMod1.define(method, nativeResolver());
+    subMod2.define(method, nativeResolver());
+  }
+
+  parentMod.register_attribute(
+      "subMod1",
+      cu->get_interface("__torch__.OneInterface"),
+      subMod1._ivalue());
+  parentMod.register_attribute(
+      "subMod2",
+      cu->get_interface("__torch__.OneInterface"),
+      subMod2._ivalue());
+
+  parentMod.define(parentForward, nativeResolver());
+
+  Module clonedMod = parentMod.clone();
+
+  // clone copies both the type and the data, so the cloned module
+  // ends up with a different type from the original
+  ASSERT_NE(clonedMod.type(), parentMod.type());
+}
+
 void testModuleCopy() {
   auto cu = std::make_shared<CompilationUnit>();
   auto cls = ClassType::create("foo.bar", cu, true);

@@ -75,6 +75,7 @@ namespace jit {
   _(ClassDerive) \
   _(SaveLoadTorchbind) \
   _(ModuleInterfaceSerialization) \
+  _(ModuleCloneWithModuleInterface) \
   _(ClassTypeAddRemoveAttr) \
   _(Inliner) \
   _(LiteInterpreterAdd) \

@@ -395,6 +395,80 @@ class TestQuantizeJitPasses(QuantizationTestCase):
         # for weight
         assert len(attrs_with_prefix(m.conv, '_observer_')) == 1
 
+    def test_insert_observers_interface(self):
+        @torch.jit.interface
+        class SubInterface(torch.nn.Module):
+            def addOne(self, inp) -> torch.Tensor:
+                pass
+
+        class Sub(torch.nn.Module):
+            def __init__(self):
+                super(Sub, self).__init__()
+                self.fc = torch.nn.Linear(5, 5)
+
+            def addOne(self, inp):
+                return self.fc(inp) + 1
+
+            def forward(self, x):
+                return self.addOne(x)
+
+        class M(torch.nn.Module):
+            def __init__(self):
+                super(M, self).__init__()
+                self.conv = torch.nn.Conv2d(3, 5, 3)
+                self.sub = Sub()
+
+            def forward(self, x):
+                return self.sub(self.conv(x))
+
+        m = torch.jit.script(M())
+        qconfig_dict = {'sub.conv': default_qconfig}
+        m = prepare_jit(m, qconfig_dict)
+
+    def test_insert_observers_interface_unshare_type(self):
+        @torch.jit.interface
+        class OperatorIf(nn.Module):
+            def forward(self, inp: torch.Tensor) -> torch.Tensor:
+                pass
+
+        class Operator(nn.Module):
+            def __init__(self, a):
+                super().__init__()
+                self.a = a
+
+            def forward(self, inp: torch.Tensor) -> torch.Tensor:
+                return self.a * (inp + self.a)
+
+        class Inner(nn.Module):
+            op: OperatorIf
+
+            def __init__(self, op):
+                super().__init__()
+                self.op = op
+
+            def forward(self, inp):
+                return self.op(inp)
+
+        class Outer(nn.Module):
+            def __init__(self):
+                super().__init__()
+                self.inner_a = Inner(Operator(1))
+                self.inner_b = Inner(Operator(3.0))
+
+            def forward(self, inp):
+                return self.inner_a(inp) + self.inner_b(inp)
+
+        qconfig_dict = {'inner_a': default_qconfig, 'inner_b': default_qconfig}
+        eager_model = Outer()
+        for tracing in [True, False]:
+            x = torch.rand(3)
+            script_model = get_script_module(eager_model, tracing, x)
+            # make sure it runs
+            prepare_jit(script_model, qconfig_dict)
+
     def test_insert_observers_child_qconfig(self):
         class Sub(torch.nn.Module):
             def __init__(self):

@@ -203,18 +203,29 @@ Module Module::clone_impl(
   size_t N = type()->numAttributes();
   for (size_t i = 0; i < N; ++i) {
     IValue s = _ivalue()->getSlot(i);
-    if (type()->getAttribute(i)->is_module()) {
+    std::string attr_name = type()->getAttributeName(i);
+    TypePtr attr_type = type()->getAttribute(i);
+    if (attr_type->is_module()) {
       const Module& orig = Module(s.toObject());
       Module cloned = orig.clone_impl(type_remap, inplace, memo);
       type_remap[orig.type()] = cloned.type();
-      r.register_module(type()->getAttributeName(i), cloned);
+      // NOTE: why do we need to manually setattr on the object instead of
+      // using register_module here? Because the attribute can be a module
+      // interface type and still hold a Module object. register_module
+      // does not let us set up the type for this attribute correctly, so we
+      // have to do it manually. If the attribute is an interface type, the
+      // type is shared with the new cloned instance in the same compilation
+      // unit, because it only contains a list of FunctionSchemas.
+      r.type()->addOrCheckAttribute(
+          attr_name, attr_type->cast<ClassType>() ? cloned.type() : attr_type);
+      r._ivalue()->setAttr(attr_name, cloned._ivalue());
     } else {
       // this adds a new slot and creates a new attribute on the underlying
       // type if the type has not been cloned yet; otherwise it only adds a
      // new slot and typechecks
       r.register_attribute(
           type()->getAttributeName(i),
-          type()->getAttribute(i),
+          attr_type,
           // deepcopy the IValue when not cloning in place
           inplace ? s : s.deepcopy(memo),
           type()->is_parameter(i),
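
Condensing the logic above: a submodule attribute declared with a
concrete ClassType is re-registered with its freshly cloned type, while
an interface-typed attribute keeps the original type, which is safe to
share because an interface type carries only method schemas and no
per-instance slots. A hedged sketch of just that decision (the helper
name is hypothetical, not part of the PR):

    #include <torch/csrc/jit/api/module.h>

    // Hypothetical helper, sketching the decision made in clone_impl above.
    static c10::TypePtr chooseClonedAttrType(
        const c10::TypePtr& attr_type,
        const torch::jit::Module& cloned) {
      if (attr_type->cast<c10::ClassType>()) {
        // Concrete class type: every clone gets its own freshly cloned type.
        return cloned.type();
      }
      // Interface type: only FunctionSchemas inside, no attribute slots,
      // so the original type can be shared by all clones in the unit.
      return attr_type;
    }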

@@ -124,11 +124,24 @@ class ModuleCloneHelper {
     size_t N = type->numAttributes();
     for (size_t i = 0; i < N; ++i) {
       IValue s = module._ivalue()->getSlot(i);
-      if (type->getAttribute(i)->is_module()) {
+      std::string attr_name = type->getAttributeName(i);
+      TypePtr attr_type = type->getAttribute(i);
+      if (attr_type->is_module()) {
         const Module& orig = Module(s.toObject());
         Module cloned =
             clone_impl(orig, module_qconfig_map, type_remap, inplace, memo);
-        r.register_module(type->getAttributeName(i), cloned);
+        // NOTE: why do we need to manually setattr on the object instead of
+        // using register_module here? Because the attribute can be a module
+        // interface type and still hold a Module object. register_module
+        // does not let us set up the type for this attribute correctly, so
+        // we have to do it manually. If the attribute is an interface type,
+        // the type is shared with the new cloned instance in the same
+        // compilation unit, because it only contains a list of FunctionSchemas.
+        r.type()->addOrCheckAttribute(
+            attr_name,
+            attr_type->cast<ClassType>() ? cloned.type() : attr_type);
+        r._ivalue()->setAttr(attr_name, cloned._ivalue());
       } else {
         // deepcopy the IValue when not cloning in place
         r.register_attribute(