diff --git a/learner_recovery.py b/learner_recovery.py index be6d87a..cfd77dd 100644 --- a/learner_recovery.py +++ b/learner_recovery.py @@ -43,8 +43,8 @@ fps = 120 / frame_skip gamma = np.exp(np.log(0.5) / (fps * half_life_seconds)) config = dict( - actor_lr=1e-4, - critic_lr=1e-4, + actor_lr=3e-5, + critic_lr=3e-5, n_steps=Constants_recovery.STEP_SIZE, batch_size=250_000, minibatch_size=125_000, @@ -103,8 +103,8 @@ tick_skip=Constants_recovery.FRAME_SKIP, curve_wave_zap_dash_w=0.15, walldash_w=0.35, - jump_high_speed_w=-0.02, - slow_w=-0.01, + jump_high_speed_w=-0.1, + slow_w=-0.05, ), lambda: CoyoteAction(), save_every=logger.config.save_every * 3, @@ -173,10 +173,10 @@ ) - alg.load("recovery_saves/Opti_1675399228.0879781/Opti_935/checkpoint.pt") + alg.load("recovery_saves/Opti_1675515807.4002893/Opti_1320/checkpoint.pt") alg.agent.optimizer.param_groups[0]["lr"] = logger.config.actor_lr alg.agent.optimizer.param_groups[1]["lr"] = logger.config.critic_lr - alg.freeze_policy(60) + alg.freeze_policy(20) alg.run(iterations_per_save=logger.config.save_every, save_dir="recovery_saves") diff --git a/setter.py b/setter.py index 86389cd..ab66496 100644 --- a/setter.py +++ b/setter.py @@ -216,7 +216,7 @@ def __init__(self, mode, end_object_choice=None): Wavedash(zero_boost_weight=0.7, zero_ball_vel_weight=0.8), RecoverySetter(zero_boost_weight=0.7, zero_ball_vel_weight=0.8) ), - (0.15, 0.2, 0.1, 0.175, 0.15, 0.175, 0.05) + (0.1, 0.1, 0.25, 0.25, 0, 0.15, 0.15) ) ) # self.setters.append( diff --git a/worker_recovery.py b/worker_recovery.py index 6f6015c..bd979c8 100644 --- a/worker_recovery.py +++ b/worker_recovery.py @@ -37,8 +37,8 @@ tick_skip=Constants_recovery.FRAME_SKIP, curve_wave_zap_dash_w=0.15, walldash_w=0.35, - jump_high_speed_w=-0.02, - slow_w=-0.01, + jump_high_speed_w=-0.1, + slow_w=-0.05, ) fps = 120 // frame_skip