diff --git a/tmrl/config/config_objects.py b/tmrl/config/config_objects.py index a80676c..b1e5fe1 100644 --- a/tmrl/config/config_objects.py +++ b/tmrl/config/config_objects.py @@ -140,7 +140,7 @@ def sac_v2_entropy_scheduler(agent, epoch): agent_scheduler=None, # sac_v2_entropy_scheduler start_training=cfg.TMRL_CONFIG["ENVIRONMENT_STEPS_BEFORE_TRAINING"]) # set this > 0 to start from an existing policy (fills the buffer up to this number of samples before starting training) else: # images - TRAINER = partial0( + TRAINER = partial( TrainingOffline, Env=partial(UntouchedGymEnv, id="rtgym:real-time-gym-v0", gym_kwargs={"config": CONFIG_DICT}), Memory=MEMORY,