Skip to content
This repository has been archived by the owner on Apr 23, 2024. It is now read-only.

update config for tpu inference of repr #2

Merged
merged 1 commit into from
Apr 15, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
12 changes: 6 additions & 6 deletions muzero/config.py
Original file line number Diff line number Diff line change
Expand Up @@ -38,7 +38,7 @@ class TrainConfig:
batchsize: int = 512
total_training_steps: int = 1_000_000
log_period: int = 10
ckpt_save_interval_steps: int = 50
ckpt_save_interval_steps: int = 100
# TEST:
# batchsize: int = 8
# log_period: int = 1
Expand All @@ -65,15 +65,15 @@ class ReplayConfig:
class InferenceConfig:
"""Inference configuration for MZ."""

dyna_batch_size: int = 16
repr_batch_size: int = 8
dyna_time_out: float = 0.0005
dyna_batch_size: int = 32
repr_batch_size: int = 16
dyna_time_out: float = 0.00001
repr_time_out: float = 0.001
dyna_update_interval: int = (
75000 # repr_update_interval * num_simulations in mcts/utils.py
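5000 # NOTE(review): previously documented as repr_update_interval * num_simulations in mcts/utils.py; 5000 is not an integer multiple of repr_update_interval (1500) — confirm the intended relation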
)
repr_update_interval: int = 1500
dyna_actor_per_replica: int = 80
dyna_actor_per_replica: int = 50
repr_actor_per_replica: int = 80


Expand Down
1 change: 1 addition & 0 deletions muzero/ray_inference.py
Original file line number Diff line number Diff line change
Expand Up @@ -237,6 +237,7 @@ def dyna_and_pred(params, embedding, action):
if latest_step is None:
latest_step = 0
print(f"need to load actor latest_ckpt_step={latest_step}")
self.step = latest_step
while True:
try:
restored = self._ckpt_manager.restore(latest_step)
Expand Down
Loading
Loading