@@ -252,7 +252,7 @@ def make_env(env_type, real_env, sim_env_kwargs):
252
252
253
253
def make_agent (
254
254
agent_type , env , policy_hparams , policy_dir , sampling_temp ,
255
- sim_env_kwargs = None , frame_stack_size = None , rollout_agent_type = None ,
255
+ sim_env_kwargs_fn = None , frame_stack_size = None , rollout_agent_type = None ,
256
256
batch_size = None , inner_batch_size = None , env_type = None , ** planner_kwargs
257
257
):
258
258
"""Factory function for Agents."""
@@ -270,7 +270,7 @@ def make_agent(
270
270
batch_size , make_agent (
271
271
rollout_agent_type , env , policy_hparams , policy_dir ,
272
272
sampling_temp , batch_size = inner_batch_size
273
- ), make_env (env_type , env .env , sim_env_kwargs ),
273
+ ), make_env (env_type , env .env , sim_env_kwargs_fn () ),
274
274
lambda env : rl_utils .BatchStackWrapper (env , frame_stack_size ),
275
275
discount_factor = policy_hparams .gae_gamma , ** planner_kwargs
276
276
),
@@ -302,17 +302,18 @@ def make_agent_from_hparams(
302
302
planner_hparams , model_dir , policy_dir , sampling_temp , video_writers = ()
303
303
):
304
304
"""Creates an Agent from hparams."""
305
- sim_env_kwargs = rl .make_simulated_env_kwargs (
306
- base_env , loop_hparams , batch_size = planner_hparams .batch_size ,
307
- model_dir = model_dir
308
- )
305
+ def sim_env_kwargs_fn ():
306
+ return rl .make_simulated_env_kwargs (
307
+ base_env , loop_hparams , batch_size = planner_hparams .batch_size ,
308
+ model_dir = model_dir
309
+ )
309
310
planner_kwargs = planner_hparams .values ()
310
311
planner_kwargs .pop ("batch_size" )
311
312
planner_kwargs .pop ("rollout_agent_type" )
312
313
planner_kwargs .pop ("env_type" )
313
314
return make_agent (
314
315
agent_type , stacked_env , policy_hparams , policy_dir , sampling_temp ,
315
- sim_env_kwargs , loop_hparams .frame_stack_size ,
316
+ sim_env_kwargs_fn , loop_hparams .frame_stack_size ,
316
317
planner_hparams .rollout_agent_type ,
317
318
inner_batch_size = planner_hparams .batch_size ,
318
319
env_type = planner_hparams .env_type ,
0 commit comments