@@ -17,8 +17,8 @@ def create_config(env_id, observation_shape_list, action_space_size_list, collec
17
17
action_space_size_list = action_space_size_list ,
18
18
from_pixels = False ,
19
19
# ===== only for debug =====
20
- frame_skip = 50 , # 100
21
- # frame_skip=2,
20
+ # frame_skip=50, # 100
21
+ frame_skip = 2 ,
22
22
continuous = True , # Assuming all DMC tasks use continuous action spaces
23
23
collector_env_num = collector_env_num ,
24
24
evaluator_env_num = evaluator_env_num ,
@@ -156,7 +156,7 @@ def generate_configs(env_id_list: List[str],
156
156
# TODO: debug
157
157
# exp_name_prefix = f'data_suz_mt_20250113/ddp_8gpu_nlayer8_upc200_taskweight-eval1e3-10k-temp10-1_task-embed_{len(env_id_list)}tasks_brf{buffer_reanalyze_freq}_tbs{total_batch_size}_seed{seed}/'
158
158
159
- exp_name_prefix = f'data_suz_mt_20250207_debug/ddp_2gpu -moco_nlayer8_upc200_notaskweight_no-task-embed_{ len (env_id_list )} tasks_brf{ buffer_reanalyze_freq } _tbs{ total_batch_size } _seed{ seed } /'
159
+ exp_name_prefix = f'data_suz_mt_20250207/ddp_8gpu -moco_nlayer8_upc200_notaskweight_no-task-embed_{ len (env_id_list )} tasks_brf{ buffer_reanalyze_freq } _tbs{ total_batch_size } _seed{ seed } /'
160
160
161
161
# exp_name_prefix = f'data_suz_mt_20250113/ddp_3gpu_3games_nlayer8_upc200_notusp_notaskweight-symlog-01-05-eval1e3_{len(env_id_list)}tasks_brf{buffer_reanalyze_freq}_tbs{total_batch_size}_seed{seed}/'
162
162
@@ -208,7 +208,7 @@ def create_env_manager():
208
208
Overview:
209
209
This script should be executed with <nproc_per_node> GPUs.
210
210
Run the following command to launch the script:
211
- python -m torch.distributed.launch --nproc_per_node=2 --master_port=29500 ./zoo/dmc2gym/config/dmc2gym_state_suz_multitask_ddp_8games_moco_config.py
211
+ python -m torch.distributed.launch --nproc_per_node=2 --master_port=29501 ./zoo/dmc2gym/config/dmc2gym_state_suz_multitask_ddp_8games_moco_config.py
212
212
torchrun --nproc_per_node=8 ./zoo/dmc2gym/config/dmc2gym_state_suz_multitask_ddp_8games_moco_config.py
213
213
"""
214
214
@@ -239,16 +239,16 @@ def create_env_manager():
239
239
# ]
240
240
241
241
# DMC 8games
242
- # env_id_list = [
243
- # 'acrobot-swingup',
244
- # 'cartpole-balance',
245
- # 'cartpole-balance_sparse',
246
- # 'cartpole-swingup',
247
- # 'cartpole-swingup_sparse',
248
- # 'cheetah-run',
249
- # "ball_in_cup-catch",
250
- # "finger-spin",
251
- # ]
242
+ env_id_list = [
243
+ 'acrobot-swingup' ,
244
+ 'cartpole-balance' ,
245
+ 'cartpole-balance_sparse' ,
246
+ 'cartpole-swingup' ,
247
+ 'cartpole-swingup_sparse' ,
248
+ 'cheetah-run' ,
249
+ "ball_in_cup-catch" ,
250
+ "finger-spin" ,
251
+ ]
252
252
253
253
# DMC 18games
254
254
# env_id_list = [
@@ -302,12 +302,12 @@ def create_env_manager():
302
302
reanalyze_partition = 0.75
303
303
304
304
# ======== TODO: only for debug ========
305
- collector_env_num = 2
306
- num_segments = 2
307
- n_episode = 2
308
- evaluator_env_num = 2
309
- num_simulations = 1
310
- batch_size = [4 for _ in range (len (env_id_list ))]
305
+ # collector_env_num = 2
306
+ # num_segments = 2
307
+ # n_episode = 2
308
+ # evaluator_env_num = 2
309
+ # num_simulations = 1
310
+ # batch_size = [4 for _ in range(len(env_id_list))]
311
311
# =======================================
312
312
313
313
seed = 0 # You can iterate over multiple seeds if needed
0 commit comments