Force kwargs in PolicyWrapperFactoryIntrinsicCuriosity init

2023-10-26 10:43:48 +02:00 · 2023-10-26 10:43:48 +02:00 · da2194eff6
commit da2194eff6
parent 96298eafd8
4 changed files with 19 additions and 18 deletions
--- a/examples/atari/atari_dqn_hl.py
+++ b/examples/atari/atari_dqn_hl.py
@@ -88,12 +88,12 @@ def main(
    if icm_lr_scale > 0:
        builder.with_policy_wrapper_factory(
            PolicyWrapperFactoryIntrinsicCuriosity(
-                IntermediateModuleFactoryAtariDQNFeatures(),
+                feature_net_factory=IntermediateModuleFactoryAtariDQNFeatures(),
-                [512],
+                hidden_sizes=[512],
-                lr,
+                lr=lr,
-                icm_lr_scale,
+                lr_scale=icm_lr_scale,
-                icm_reward_scale,
+                reward_scale=icm_reward_scale,
-                icm_forward_loss_weight,
+                forward_loss_weight=icm_forward_loss_weight,
            ),
        )
--- a/examples/atari/atari_ppo_hl.py
+++ b/examples/atari/atari_ppo_hl.py
@@ -101,12 +101,12 @@ def main(
    if icm_lr_scale > 0:
        builder.with_policy_wrapper_factory(
            PolicyWrapperFactoryIntrinsicCuriosity(
-                IntermediateModuleFactoryAtariDQNFeatures(),
+                feature_net_factory=IntermediateModuleFactoryAtariDQNFeatures(),
-                [hidden_sizes],
+                hidden_sizes=[hidden_sizes],
-                lr,
+                lr=lr,
-                icm_lr_scale,
+                lr_scale=icm_lr_scale,
-                icm_reward_scale,
+                reward_scale=icm_reward_scale,
-                icm_forward_loss_weight,
+                forward_loss_weight=icm_forward_loss_weight,
            ),
        )
    experiment = builder.build()
--- a/examples/atari/atari_sac_hl.py
+++ b/examples/atari/atari_sac_hl.py
@@ -87,12 +87,12 @@ def main(
    if icm_lr_scale > 0:
        builder.with_policy_wrapper_factory(
            PolicyWrapperFactoryIntrinsicCuriosity(
-                IntermediateModuleFactoryAtariDQNFeatures(),
+                feature_net_factory=IntermediateModuleFactoryAtariDQNFeatures(),
-                [hidden_size],
+                hidden_sizes=[hidden_size],
-                actor_lr,
+                lr=actor_lr,
-                icm_lr_scale,
+                lr_scale=icm_lr_scale,
-                icm_reward_scale,
+                reward_scale=icm_reward_scale,
-                icm_forward_loss_weight,
+                forward_loss_weight=icm_forward_loss_weight,
            ),
        )
    experiment = builder.build()
--- a/tianshou/highlevel/params/policy_wrapper.py
+++ b/tianshou/highlevel/params/policy_wrapper.py
@@ -30,6 +30,7 @@ class PolicyWrapperFactoryIntrinsicCuriosity(
 ):
    def __init__(
        self,
+        *,
        feature_net_factory: IntermediateModuleFactory,
        hidden_sizes: Sequence[int],
        lr: float,