wire up the time kv cache when interacting with sim / env

2025-10-22 08:39:11 -07:00 · 2025-10-22 08:39:11 -07:00 · 7ecc5d03e8
commit 7ecc5d03e8
parent d82debb7a6
2 changed files with 16 additions and 3 deletions
--- a/dreamer4/dreamer4.py
+++ b/dreamer4/dreamer4.py
@ -1972,7 +1972,8 @@ class DynamicsWorldModel(Module):
        seed = None,
        agent_index = 0,
        step_size = 4,
-        max_timesteps = 16
+        max_timesteps = 16,
+        use_time_kv_cache = True
    ):
        assert exists(self.video_tokenizer)

@ -1990,22 +1991,34 @@ class DynamicsWorldModel(Module):
        values = None
        latents = None

+        # maybe time kv cache
+
+        time_kv_cache = None
+
        for _ in range(max_timesteps):

            latents = self.video_tokenizer(video, return_latents = True)

-            _, (agent_embed, _) = self.forward(
+            _, (agent_embed, next_time_kv_cache) = self.forward(
                latents = latents,
                signal_levels = self.max_steps - 1,
                step_sizes = step_size,
                rewards = rewards,
                discrete_actions = discrete_actions,
                continuous_actions = continuous_actions,
+                time_kv_cache = time_kv_cache,
                latent_is_noised = True,
                return_pred_only = True,
                return_intermediates = True
            )

+            # time kv cache
+
+            if use_time_kv_cache:
+                time_kv_cache = next_time_kv_cache
+
+            # get one agent
+
            one_agent_embed = agent_embed[..., -1:, agent_index, :]

            policy_embed = self.policy_head(one_agent_embed)
--- a/pyproject.toml
+++ b/pyproject.toml
@ -1,6 +1,6 @@
 [project]
 name = "dreamer4"
-version = "0.0.61"
+version = "0.0.62"
 description = "Dreamer 4"
 authors = [
    { name = "Phil Wang", email = "lucidrains@gmail.com" }