Skip to content
This repository was archived by the owner on Jul 7, 2023. It is now read-only.

Commit dabd95e

Browse files
Lukasz Kaiser authored and copybara-github committed
Add 20k and 50k setups for mbrl.
PiperOrigin-RevId: 246410996
1 parent 5eb6e61 commit dabd95e

File tree

1 file changed

+20
-0
lines changed

1 file changed

+20
-0
lines changed

tensor2tensor/rl/trainer_model_based_params.py

Lines changed: 20 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -332,6 +332,26 @@ def rlmb_base_stochastic_discrete_sticky_actions():
332332
return hparams
333333

334334

335+
@registry.register_hparams
def rlmb_base_stochastic_discrete_20k():
  """Stochastic discrete base setting with a ~20k real-frame budget.

  Starts from `rlmb_base_stochastic_discrete()` and overrides the number of
  real environment frames, the number of epochs and the number of PPO epochs.

  Returns:
    The hparams object returned by `rlmb_base_stochastic_discrete()` with the
    three overrides below applied.
  """
  params = rlmb_base_stochastic_discrete()
  # num_real_env_frames should be divisible by real_ppo_epoch_length * epochs.
  # Epochs are reduced to 6 here, which gives 16 * 200 * 6 = 19200 frames.
  params.num_real_env_frames = 19200
  params.epochs = 6
  # There are fewer epochs, so the number of PPO steps is increased.
  params.ppo_epochs_num = 2000
  return params
345+
346+
347+
@registry.register_hparams
def rlmb_base_stochastic_discrete_50k():
  """Stochastic discrete base setting with a ~50k real-frame budget.

  Starts from `rlmb_base_stochastic_discrete()` and only overrides the number
  of real environment frames. The value set is 48000, not exactly 50000.

  Returns:
    The hparams object returned by `rlmb_base_stochastic_discrete()` with
    `num_real_env_frames` set to 48000.
  """
  params = rlmb_base_stochastic_discrete()
  # NOTE(review): 48000 is presumably chosen so that it stays divisible by
  # real_ppo_epoch_length * epochs with the inherited epochs value -- confirm.
  params.num_real_env_frames = 48000
  return params
353+
354+
335355
@registry.register_hparams
336356
def rlmb_base_stochastic_discrete_75k_model_steps():
337357
"""Base setting with stochastic discrete model with 75k WM steps."""

0 commit comments

Comments
 (0)