[Feature]: Added support for TensorDictSequence module subsampling #332

Merged
12 commits merged on Aug 10, 2022
Changed to module subsequencing
nicolas-dufour committed Aug 5, 2022
commit 974eb9750278ae673b54eb623b53a18d6fc416b6
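For orientation, here is a minimal sketch (not part of the diff) of the API this commit introduces, mirroring the updated test below; the import paths are an assumption for the torchrl version this PR targets:

import torch
from torch import nn

# Import paths are an assumption for the torchrl version this PR targets.
from torchrl.data import TensorDict
from torchrl.modules import TensorDictModule, TensorDictSequence

# Two-stage sequence: "in" -> "hidden" -> "out" (mirrors the updated test).
td_module = TensorDictSequence(
    TensorDictModule(nn.Linear(3, 2), in_keys=["in"], out_keys=["hidden"]),
    TensorDictModule(nn.Linear(2, 4), in_keys=["hidden"], out_keys=["out"]),
)

# Keep only the modules needed to produce "hidden"; "out" is never written.
sub_seq_1 = td_module.select_subsequence(out_keys=["hidden"])
td_1 = sub_seq_1(TensorDict({"in": torch.randn(5, 3)}, [5]))

# Keep only the modules that can run from a precomputed "hidden"; this writes "out".
sub_seq_2 = td_module.select_subsequence(in_keys=["hidden"])
td_2 = sub_seq_2(TensorDict({"hidden": torch.randn(5, 2)}, [5]))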
50 changes: 37 additions & 13 deletions test/test_tensordictmodules.py
@@ -1542,42 +1542,66 @@ def test_submodule_sequence(self, functional):
td_module = TensorDictSequence(td_module_1, td_module_2)

if functional:
td_module, (params, buffers) = td_module.make_functional_with_buffers()
td_0 = TensorDict({"in": torch.randn(5, 3)}, [5])
td_module(td_0, params=params, buffers=buffers)
assert td_0.get("out").shape == torch.Size([5, 4])
td_1 = TensorDict({"in": torch.randn(5, 3)}, [5])
td_module(
sub_seq_1 = td_module.select_subsequence(out_keys=["hidden"])
sub_seq_1, (params, buffers) = sub_seq_1.make_functional_with_buffers()
sub_seq_1(
td_1,
out_keys_filter=["hidden"],
params=params,
buffers=buffers,
)
assert "hidden" in td_1.keys()
assert "out" not in td_1.keys()
td_2 = TensorDict({"hidden": torch.randn(5, 2)}, [5])
td_module(
sub_seq_2 = td_module.select_subsequence(in_keys=["hidden"])
sub_seq_2, (params, buffers) = sub_seq_2.make_functional_with_buffers()
sub_seq_2(
td_2,
in_keys_filter=["hidden"],
params=params,
buffers=buffers,
)
assert "out" in td_2.keys()
assert td_2.get("out").shape == torch.Size([5, 4])
else:
td_0 = TensorDict({"in": torch.randn(5, 3)}, [5])
td_module(td_0)
assert td_0.get("out").shape == torch.Size([5, 4])
td_1 = TensorDict({"in": torch.randn(5, 3)}, [5])
td_module(td_1, out_keys_filter=["hidden"])
sub_seq_1 = td_module.select_subsequence(out_keys=["hidden"])
sub_seq_1(td_1)
assert "hidden" in td_1.keys()
assert "out" not in td_1.keys()
td_2 = TensorDict({"hidden": torch.randn(5, 2)}, [5])
td_module(td_2, in_keys_filter=["hidden"])
sub_seq_2 = td_module.select_subsequence(in_keys=["hidden"])
sub_seq_2(td_2)
assert "out" in td_2.keys()
assert td_2.get("out").shape == torch.Size([5, 4])


def test_subsequence_weight_update():
td_module_1 = TensorDictModule(
nn.Linear(3, 2),
in_keys=["in"],
out_keys=["hidden"],
)
td_module_2 = TensorDictModule(
nn.Linear(2, 4),
in_keys=["hidden"],
out_keys=["out"],
)
td_module = TensorDictSequence(td_module_1, td_module_2)

td_1 = TensorDict({"in": torch.randn(5, 3)}, [5])
sub_seq_1 = td_module.select_subsequence(out_keys=["hidden"])
copy = sub_seq_1[0].module.weight.clone()

opt = torch.optim.SGD(td_module.parameters(), lr=0.1)
opt.zero_grad()
td_1 = td_module(td_1)
td_1["out"].mean().backward()
opt.step()

assert not torch.allclose(copy, sub_seq_1[0].module.weight)
assert torch.allclose(td_module[0].module.weight, sub_seq_1[0].module.weight)


if __name__ == "__main__":
args, unknown = argparse.ArgumentParser().parse_known_args()
pytest.main([__file__, "--capture", "no", "--exitfirst"] + unknown)
63 changes: 36 additions & 27 deletions torchrl/modules/tensordict_module/sequence.py
@@ -195,44 +195,57 @@ def _split_param(
out.append(param_list[a:b])
return out

def forward(
self,
tensordict: TensorDictBase,
in_keys_filter=None,
out_keys_filter=None,
tensordict_out=None,
**kwargs,
) -> TensorDictBase:
def select_subsequence(
self, in_keys: Iterable[str] = None, out_keys: Iterable[str] = None
) -> "TensorDictSequence":
"""
Returns a new TensorDictSequence containing only the modules that are necessary to compute
the given output keys from the given input keys.

Args:
in_keys: input keys of the subsequence we want to select
out_keys: output keys of the subsequence we want to select

# Filter modules to avoid calling modules that don't require the desired in_keys or out keys.
if in_keys_filter is None:
in_keys_filter = deepcopy(self.in_keys)
if out_keys_filter is None:
out_keys_filter = deepcopy(self.out_keys)
Returns:
A new TensorDictSequence with only the modules that are necessary according to the given input and output keys.
"""
if in_keys is None:
in_keys = deepcopy(self.in_keys)
if out_keys is None:
out_keys = deepcopy(self.out_keys)
id_to_keep = set([i for i in range(len(self.module))])
for i, module in enumerate(self.module):
if all(key in in_keys_filter for key in module.in_keys):
in_keys_filter.extend(module.out_keys)
if all(key in in_keys for key in module.in_keys):
Contributor:
What's the usage of selecting in_keys? I can understand why we want to restrict the outputs, but I don't really see when we want to restrict inputs.

Contributor:
Also what happens if you say you want some out_keys but they conflict with the in_keys? Is the sequence going to be empty?

Contributor (Author):
We want to be able to select the in_keys so that we can directly feed an intermediary block. For example, imagine you have a hidden layer that you want to inject from a precomputed tensordict; this allows you to do so.
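
For instance, a minimal sketch of that use case (not part of the diff), following the non-functional branch of the updated test; td_module, the "hidden" key, and its shape come from the diff above:

# Inject a precomputed hidden activation and run only the downstream module(s).
sub_seq = td_module.select_subsequence(in_keys=["hidden"])
precomputed = TensorDict({"hidden": torch.randn(5, 2)}, [5])
out = sub_seq(precomputed)  # only the hidden -> out module is executed
assert "out" in out.keys()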

Contributor (Author):
Yes, it would be empty if your out_keys come before the in_keys.

Contributor:
Got it
We're doing something similar in #352: you can input an incomplete tensordict and only the relevant ops will be executed. I wonder if we need both ways of doing the same thing. The advantage of your implementation is that it is self-consistent though.

in_keys.extend(module.out_keys)
else:
id_to_keep.remove(i)
for i, module in reversed(list(enumerate(self.module))):
if i in id_to_keep:
if any(key in out_keys_filter for key in module.out_keys):
out_keys_filter.extend(module.in_keys)
if any(key in out_keys for key in module.out_keys):
out_keys.extend(module.in_keys)
else:
id_to_keep.remove(i)
id_to_keep = sorted(list(id_to_keep))

modules = [self.module[i] for i in id_to_keep]

in_keys, _ = self._compute_in_and_out_keys(modules)
return TensorDictSequence(*modules)

if not all(key in tensordict.keys() for key in in_keys):
def forward(
self,
tensordict: TensorDictBase,
tensordict_out=None,
**kwargs,
) -> TensorDictBase:

if not all(key in tensordict.keys() for key in self.in_keys):

raise ValueError(
f"Not all in_keys found in input TensorDict. missing keys:{set(in_keys) - set(tensordict.keys())}"
f"Not all in_keys found in input TensorDict. missing keys:{set(self.in_keys) - set(tensordict.keys())}"
)

# Filter modules to avoid calling modules that don't require the desired in_keys or out keys

if "params" in kwargs and "buffers" in kwargs:
param_splits = self._split_param(kwargs["params"], "params")
buffer_splits = self._split_param(kwargs["buffers"], "buffers")
@@ -241,11 +254,8 @@ def forward(
for key, item in kwargs.items()
if key not in ("params", "buffers")
}
param_splits = [param_splits[i] for i in id_to_keep]
buffer_splits = [buffer_splits[i] for i in id_to_keep]

for i, (module, param, buffer) in enumerate(
zip(modules, param_splits, buffer_splits)
zip(self.module, param_splits, buffer_splits)
):
if "vmap" in kwargs_pruned and i > 0:
# the tensordict is already expanded
@@ -259,15 +269,14 @@ def forward(
kwargs_pruned = {
key: item for key, item in kwargs.items() if key not in ("params",)
}
param_splits = [param_splits[i] for i in id_to_keep]
for i, (module, param) in enumerate(zip(modules, param_splits)):
for i, (module, param) in enumerate(zip(self.module, param_splits)):
if "vmap" in kwargs_pruned and i > 0:
# the tensordict is already expanded
kwargs_pruned["vmap"] = (0, *(0,) * len(module.in_keys))
tensordict = module(tensordict, params=param, **kwargs_pruned)

elif not len(kwargs):
for module in modules:
for module in self.module:
tensordict = module(tensordict)
else:
raise RuntimeError(