Skip to content

Commit

Permalink
Recovery: slight reward changes, setter changes, LR down. Slight freeze.
Browse files Browse the repository at this point in the history
  • Loading branch information
Kaiyotech committed Feb 5, 2023
1 parent 4053b9b commit 5b07386
Show file tree
Hide file tree
Showing 3 changed files with 9 additions and 9 deletions.
12 changes: 6 additions & 6 deletions learner_recovery.py
Original file line number Diff line number Diff line change
Expand Up @@ -43,8 +43,8 @@
fps = 120 / frame_skip
gamma = np.exp(np.log(0.5) / (fps * half_life_seconds))
config = dict(
-actor_lr=1e-4,
-critic_lr=1e-4,
+actor_lr=3e-5,
+critic_lr=3e-5,
n_steps=Constants_recovery.STEP_SIZE,
batch_size=250_000,
minibatch_size=125_000,
Expand Down Expand Up @@ -103,8 +103,8 @@
tick_skip=Constants_recovery.FRAME_SKIP,
curve_wave_zap_dash_w=0.15,
walldash_w=0.35,
-jump_high_speed_w=-0.02,
-slow_w=-0.01,
+jump_high_speed_w=-0.1,
+slow_w=-0.05,
),
lambda: CoyoteAction(),
save_every=logger.config.save_every * 3,
Expand Down Expand Up @@ -173,10 +173,10 @@

)

-alg.load("recovery_saves/Opti_1675399228.0879781/Opti_935/checkpoint.pt")
+alg.load("recovery_saves/Opti_1675515807.4002893/Opti_1320/checkpoint.pt")
alg.agent.optimizer.param_groups[0]["lr"] = logger.config.actor_lr
alg.agent.optimizer.param_groups[1]["lr"] = logger.config.critic_lr

-alg.freeze_policy(60)
+alg.freeze_policy(20)

alg.run(iterations_per_save=logger.config.save_every, save_dir="recovery_saves")
2 changes: 1 addition & 1 deletion setter.py
Original file line number Diff line number Diff line change
Expand Up @@ -216,7 +216,7 @@ def __init__(self, mode, end_object_choice=None):
Wavedash(zero_boost_weight=0.7, zero_ball_vel_weight=0.8),
RecoverySetter(zero_boost_weight=0.7, zero_ball_vel_weight=0.8)
),
-(0.15, 0.2, 0.1, 0.175, 0.15, 0.175, 0.05)
+(0.1, 0.1, 0.25, 0.25, 0, 0.15, 0.15)
)
)
# self.setters.append(
Expand Down
4 changes: 2 additions & 2 deletions worker_recovery.py
Original file line number Diff line number Diff line change
Expand Up @@ -37,8 +37,8 @@
tick_skip=Constants_recovery.FRAME_SKIP,
curve_wave_zap_dash_w=0.15,
walldash_w=0.35,
-jump_high_speed_w=-0.02,
-slow_w=-0.01,
+jump_high_speed_w=-0.1,
+slow_w=-0.05,
)

fps = 120 // frame_skip
Expand Down

0 comments on commit 5b07386

Please sign in to comment.