@@ -184,8 +184,8 @@ def create_config(env_id, action_space_size, collector_env_num, evaluator_env_nu
184
184
reanalyze_ratio = reanalyze_ratio ,
185
185
n_episode = n_episode ,
186
186
replay_buffer_size = int (5e5 ),
187
- eval_freq = int (1e4 ), # TODO:
188
- # eval_freq=int(2e4),
187
+ # eval_freq=int(1e4), # TODO: 8games
188
+ eval_freq = int (2e4 ), # TODO: 26games
189
189
collector_env_num = collector_env_num ,
190
190
evaluator_env_num = evaluator_env_num ,
191
191
buffer_reanalyze_freq = buffer_reanalyze_freq ,
@@ -204,12 +204,12 @@ def generate_configs(env_id_list, action_space_size, collector_env_num, n_episod
204
204
205
205
206
206
# ========= TODO: global BENCHMARK_NAME =========
207
- exp_name_prefix = f'data_unizero_atari_mt_20250527/atari_{ len (env_id_list )} games_orig_simnorm-kl_vit_moe8_tran-nlayer{ num_layers } _brf{ buffer_reanalyze_freq } _not-share-head_seed{ seed } /'
207
+ # exp_name_prefix = f'data_unizero_atari_mt_20250527/atari_{len(env_id_list)}games_orig_simnorm-kl_vit_moe8_tran-nlayer{num_layers}_brf{buffer_reanalyze_freq}_not-share-head_seed{seed}/'
208
208
209
209
# exp_name_prefix = f'data_unizero_atari_mt_20250522/atari_{len(env_id_list)}games_orig_tran-nlayer{num_layers}_brf{buffer_reanalyze_freq}_not-share-head_seed{seed}/'
210
210
# exp_name_prefix = f'data_unizero_atari_mt_20250527/atari_{len(env_id_list)}games_orig_simnorm-kl_vit_moco-v2_tran-nlayer{num_layers}_brf{buffer_reanalyze_freq}_not-share-head_seed{seed}/'
211
211
212
- exp_name_prefix = f'data_unizero_atari_mt_20250530 /atari_{ len (env_id_list )} games_orig_vit_ln-mse_moe8_tran-nlayer{ num_layers } _brf{ buffer_reanalyze_freq } _not-share-head_seed{ seed } /'
212
+ exp_name_prefix = f'data_unizero_atari_mt_20250601 /atari_{ len (env_id_list )} games_orig_vit_ln-mse_moe8_tran-nlayer{ num_layers } _brf{ buffer_reanalyze_freq } _not-share-head_seed{ seed } /'
213
213
214
214
# exp_name_prefix = f'data_unizero_atari_mt_20250521/atari_{len(env_id_list)}games_orig_simnorm-kl_vit_moe8_taskembed128_tran-nlayer{num_layers}_rr1_brf{buffer_reanalyze_freq}_not-share-head_seed{seed}/'
215
215
@@ -254,7 +254,7 @@ def create_env_manager():
254
254
255
255
=========== volce atari26 =========================
256
256
cd /fs-computility/niuyazhe/puyuan/code/LightZero/
257
- python -m torch.distributed.launch --nproc_per_node=4 --master_port=29502 /fs-computility/niuyazhe/puyuan/code/LightZero/zoo/atari/config/atari_unizero_multitask_segment_ddp_config.py 2>&1 | tee /fs-computility/niuyazhe/puyuan/code/LightZero/log/20250509/uz_mt_atari8_orig_vit_ln-mse_moe8_nlayer8_brf002_seed12.log
257
+ python -m torch.distributed.launch --nproc_per_node=8 --master_port=29502 /fs-computility/niuyazhe/puyuan/code/LightZero/zoo/atari/config/atari_unizero_multitask_segment_ddp_config.py 2>&1 | tee /fs-computility/niuyazhe/puyuan/code/LightZero/log/20250509/uz_mt_atari26_orig_vit_ln-mse_moe8_nlayer8_brf002_seed12.log
258
258
259
259
260
260
=========== cpfs atari8 =========================
@@ -306,7 +306,7 @@ def create_env_manager():
306
306
import os
307
307
308
308
309
- num_games = 8 # 26 # 8
309
+ num_games = 26 # 26 # 8
310
310
num_layers = 8 # ==============TODO==============
311
311
action_space_size = 18
312
312
collector_env_num = 8
@@ -383,7 +383,7 @@ def create_env_manager():
383
383
384
384
385
385
import torch .distributed as dist
386
- for seed in [1 ]:
386
+ for seed in [1 , 2 ]:
387
387
configs = generate_configs (env_id_list , action_space_size , collector_env_num , n_episode , evaluator_env_num ,
388
388
num_simulations , reanalyze_ratio , batch_sizes , num_unroll_steps , infer_context_length ,
389
389
norm_type , seed , buffer_reanalyze_freq , reanalyze_batch_size , reanalyze_partition ,
0 commit comments