be able to move the experience to cpu easily, and automatically move it to the device of the dynamics world model when learning from it

2025-11-09 16:16:13 +00:00 · 2025-11-09 16:16:13 +00:00 · cfd34f1eba
commit cfd34f1eba
parent 24ef72d528
4 changed files with 19 additions and 3 deletions
--- a/dreamer4/dreamer4.py
+++ b/dreamer4/dreamer4.py
@ -14,7 +14,7 @@ from torch.nested import nested_tensor
 from torch.distributions import Normal, kl
 from torch.nn import Module, ModuleList, Embedding, Parameter, Sequential, Linear, RMSNorm, Identity
 from torch import nn, cat, stack, arange, tensor, Tensor, is_tensor, full, zeros, ones, randint, rand, randn, randn_like, empty, full, linspace, arange
-from torch.utils._pytree import tree_flatten, tree_unflatten
+from torch.utils._pytree import tree_map, tree_flatten, tree_unflatten

 import torchvision
 from torchvision.models import VGG16_Weights
@ -91,6 +91,14 @@ class Experience:
    agent_index: int = 0
    is_from_world_model: bool = True

+    def cpu(self):
+        return self.to(torch.device('cpu'))
+
+    def to(self, device):
+        experience_dict = asdict(self)
+        experience_dict = tree_map(lambda t: t.to(device) if is_tensor(t) else t, experience_dict)
+        return Experience(**experience_dict)
+
 def combine_experiences(
    exps: list[Experiences]
 ) -> Experience:
@ -2435,6 +2443,8 @@ class DynamicsWorldModel(Module):
    ):
        assert isinstance(experience, Experience)

+        experience = experience.to(self.device)
+
        latents = experience.latents
        actions = experience.actions
        old_log_probs = experience.log_probs
--- a/dreamer4/trainers.py
+++ b/dreamer4/trainers.py
@ -528,7 +528,7 @@ class SimTrainer(Module):

                total_experience += num_experience

-                experiences.append(experience)
+                experiences.append(experience.cpu())

            combined_experiences = combine_experiences(experiences)

--- a/pyproject.toml
+++ b/pyproject.toml
@ -1,6 +1,6 @@
 [project]
 name = "dreamer4"
-version = "0.1.4"
+version = "0.1.5"
 description = "Dreamer 4"
 authors = [
    { name = "Phil Wang", email = "lucidrains@gmail.com" }
--- a/tests/test_dreamer.py
+++ b/tests/test_dreamer.py
@ -680,6 +680,12 @@ def test_online_rl(

    combined_experience = combine_experiences([one_experience, another_experience])

+    # quick test moving the experience to different devices
+
+    if torch.cuda.is_available():
+        combined_experience = combined_experience.to(torch.device('cuda'))
+        combined_experience = combined_experience.to(world_model_and_policy.device)
+
    if store_agent_embed:
        assert exists(combined_experience.agent_embed)