Skip to content

Commit

Permalink
freeze recovery actor, new rewards, rollback, 935.
Browse files Browse the repository at this point in the history
  • Loading branch information
Kaiyotech committed Feb 4, 2023
1 parent 0c06c0c commit 4053b9b
Show file tree
Hide file tree
Showing 2 changed files with 13 additions and 13 deletions.
16 changes: 8 additions & 8 deletions learner_recovery.py
Original file line number Diff line number Diff line change
Expand Up @@ -55,10 +55,10 @@
ent_coef=0.01,
)

run_id = "recovery_run11.01"
run_id = "recovery_run11.02"
wandb.login(key=os.environ["WANDB_KEY"])
logger = wandb.init(dir="./wandb_store",
name="Recovery_Run11.01",
name="Recovery_Run11.02",
project="Opti",
entity="kaiyotech",
id=run_id,
Expand Down Expand Up @@ -92,19 +92,19 @@
boost_spend_w=4,
punish_boost=True,
touch_ball_w=2.5,
boost_remain_touch_w=1.75,
boost_remain_touch_w=2,
touch_grass_w=0,
supersonic_bonus_vpb_w=0,
zero_touch_grass_if_ss=False,
turtle_w=0,
final_reward_ball_dist_w=1,
final_reward_boost_w=0.2,
final_reward_boost_w=0.3,
forward_ctrl_w=0,
tick_skip=Constants_recovery.FRAME_SKIP,
curve_wave_zap_dash_w=0.1,
curve_wave_zap_dash_w=0.15,
walldash_w=0.35,
jump_high_speed_w=-1,
slow_w=-0.5,
jump_high_speed_w=-0.02,
slow_w=-0.01,
),
lambda: CoyoteAction(),
save_every=logger.config.save_every * 3,
Expand Down Expand Up @@ -177,6 +177,6 @@
alg.agent.optimizer.param_groups[0]["lr"] = logger.config.actor_lr
alg.agent.optimizer.param_groups[1]["lr"] = logger.config.critic_lr

alg.freeze_policy(100)
alg.freeze_policy(60)

alg.run(iterations_per_save=logger.config.save_every, save_dir="recovery_saves")
10 changes: 5 additions & 5 deletions worker_recovery.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,19 +26,19 @@
boost_spend_w=4,
punish_boost=True,
touch_ball_w=2.5,
boost_remain_touch_w=1.75,
boost_remain_touch_w=2,
touch_grass_w=0,
supersonic_bonus_vpb_w=0,
zero_touch_grass_if_ss=False,
turtle_w=0,
final_reward_ball_dist_w=1,
final_reward_boost_w=0.2,
final_reward_boost_w=0.3,
forward_ctrl_w=0,
tick_skip=Constants_recovery.FRAME_SKIP,
curve_wave_zap_dash_w=0.1,
curve_wave_zap_dash_w=0.15,
walldash_w=0.35,
jump_high_speed_w=-1,
slow_w=-0.5,
jump_high_speed_w=-0.02,
slow_w=-0.01,
)

fps = 120 // frame_skip
Expand Down

0 comments on commit 4053b9b

Please sign in to comment.