modified network structures to match the paper

This commit is contained in:
NM512 2023-02-18 10:13:02 +09:00
parent fb5c21557a
commit f96ad071d1
2 changed files with 6 additions and 5 deletions

View File

@ -6,7 +6,7 @@ defaults:
offline_traindir: ''
offline_evaldir: ''
seed: 0
steps: 5e5
steps: 1e6
eval_every: 1e4
log_every: 1e4
reset_every: 0
@ -36,8 +36,8 @@ defaults:
dyn_deter: 512
dyn_stoch: 32
dyn_discrete: 32
dyn_input_layers: 1
dyn_output_layers: 1
dyn_input_layers: 2
dyn_output_layers: 2
dyn_rec_depth: 1
dyn_shared: False
dyn_mean_act: 'none'
@ -45,7 +45,7 @@ defaults:
dyn_min_std: 0.1
dyn_temp_post: True
grad_heads: ['image', 'reward', 'discount']
units: 256
units: 512
reward_layers: 2
discount_layers: 2
value_layers: 2
@ -86,7 +86,7 @@ defaults:
oversample_ends: False
slow_value_target: True
slow_actor_target: True
slow_target_update: 50
slow_target_update: 100
slow_target_fraction: 0.01
opt: 'adam'

View File

@ -60,6 +60,7 @@ class RSSM(nn.Module):
inp_dim += self._embed
for i in range(self._layers_input):
inp_layers.append(nn.Linear(inp_dim, self._hidden))
inp_layers.append(self._norm(self._hidden))
inp_layers.append(self._act())
if i == 0:
inp_dim = self._hidden