diff --git a/dreamer4/dreamer4.py b/dreamer4/dreamer4.py index e0f8adc..a3cc903 100644 --- a/dreamer4/dreamer4.py +++ b/dreamer4/dreamer4.py @@ -2870,6 +2870,13 @@ class DynamicsWorldModel(Module): space_tokens = self.latents_to_spatial_tokens(noised_latents) + # maybe add view embedding + + if self.video_has_multi_view: + space_tokens = add('b t v ... d, v d', space_tokens, self.view_emb) + + # merge spatial tokens + space_tokens, inverse_pack_space_per_latent = pack_one(space_tokens, 'b t * d') num_spatial_tokens = space_tokens.shape[-2] diff --git a/pyproject.toml b/pyproject.toml index bca30ee..8981fb6 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,6 +1,6 @@ [project] name = "dreamer4" -version = "0.0.74" +version = "0.0.75" description = "Dreamer 4" authors = [ { name = "Phil Wang", email = "lucidrains@gmail.com" }