Skip to content

Commit 71492e5

Browse files
committed
add additional configs with shorter unroll lengths
1 parent 09e98c6 commit 71492e5

File tree

4 files changed

+76
-20
lines changed

4 files changed

+76
-20
lines changed

experiment_code/mrunner_exps/ICLR_baselines/2023_20_09_monk-APPO-AA-CEAA-T.py

Lines changed: 22 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -24,12 +24,6 @@
2424
"use_resnet": True,
2525
"model": "NetHackNetTtyrec",
2626
"unfreeze_actor_steps": 50_000_000,
27-
"actor_batch_size": 64,
28-
"batch_size": 32,
29-
"virtual_batch_size": 32,
30-
"ttyrec_batch_size": 128,
31-
"unroll_length": 80,
32-
"ttyrec_unroll_length": 80,
3327
}
3428

3529
# params different between exps
@@ -40,10 +34,32 @@
4034
"baseline_cost": [0.5],
4135
"reward_clip": [False],
4236
"adam_learning_rate": [0.0002],
37+
"actor_batch_size": [64],
38+
"batch_size": [32],
39+
"virtual_batch_size": [32],
40+
"ttyrec_batch_size": [128],
41+
"unroll_length": [80],
42+
"ttyrec_unroll_length": [80],
4343
},
4444
{
4545
"seed": list(range(5)),
4646
"adam_learning_rate": [0.001],
47+
"actor_batch_size": [64],
48+
"batch_size": [32],
49+
"virtual_batch_size": [32],
50+
"ttyrec_batch_size": [128],
51+
"unroll_length": [80],
52+
"ttyrec_unroll_length": [80],
53+
},
54+
{
55+
"seed": list(range(5)),
56+
"adam_learning_rate": [0.001],
57+
"actor_batch_size": [128],
58+
"batch_size": [64],
59+
"virtual_batch_size": [64],
60+
"ttyrec_batch_size": [256],
61+
"unroll_length": [32],
62+
"ttyrec_unroll_length": [32],
4763
},
4864
]
4965

experiment_code/mrunner_exps/ICLR_baselines/2023_20_09_monk-APPO-AA-KLAA-T.py

Lines changed: 22 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -26,12 +26,6 @@
2626
"use_resnet": True,
2727
"model": "NetHackNetTtyrec",
2828
"unfreeze_actor_steps": 50_000_000,
29-
"actor_batch_size": 64,
30-
"batch_size": 32,
31-
"virtual_batch_size": 32,
32-
"ttyrec_batch_size": 128,
33-
"unroll_length": 80,
34-
"ttyrec_unroll_length": 80,
3529
}
3630

3731
# params different between exps
@@ -42,10 +36,32 @@
4236
"baseline_cost": [0.5],
4337
"reward_clip": [False],
4438
"adam_learning_rate": [0.0002],
39+
"actor_batch_size": [64],
40+
"batch_size": [32],
41+
"virtual_batch_size": [32],
42+
"ttyrec_batch_size": [128],
43+
"unroll_length": [80],
44+
"ttyrec_unroll_length": [80],
4545
},
4646
{
4747
"seed": list(range(5)),
4848
"adam_learning_rate": [0.001],
49+
"actor_batch_size": [64],
50+
"batch_size": [32],
51+
"virtual_batch_size": [32],
52+
"ttyrec_batch_size": [128],
53+
"unroll_length": [80],
54+
"ttyrec_unroll_length": [80],
55+
},
56+
{
57+
"seed": list(range(5)),
58+
"adam_learning_rate": [0.001],
59+
"actor_batch_size": [128],
60+
"batch_size": [64],
61+
"virtual_batch_size": [64],
62+
"ttyrec_batch_size": [256],
63+
"unroll_length": [32],
64+
"ttyrec_unroll_length": [32],
4965
},
5066
]
5167

experiment_code/mrunner_exps/ICLR_baselines/2023_20_09_monk-APPO-AA-KS-T.py

Lines changed: 16 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -25,10 +25,6 @@
2525
"use_resnet": True,
2626
"model": "NetHackNetTtyrec",
2727
"unfreeze_actor_steps": 50_000_000,
28-
"actor_batch_size": 64,
29-
"batch_size": 32,
30-
"virtual_batch_size": 32,
31-
"unroll_length": 80,
3228
}
3329

3430
# params different between exps
@@ -39,10 +35,26 @@
3935
"baseline_cost": [0.5],
4036
"reward_clip": [False],
4137
"adam_learning_rate": [0.0002],
38+
"actor_batch_size": [64],
39+
"batch_size": [32],
40+
"virtual_batch_size": [32],
41+
"unroll_length": [80],
4242
},
4343
{
4444
"seed": list(range(5)),
4545
"adam_learning_rate": [0.001],
46+
"actor_batch_size": [64],
47+
"batch_size": [32],
48+
"virtual_batch_size": [32],
49+
"unroll_length": [80],
50+
},
51+
{
52+
"seed": list(range(5)),
53+
"adam_learning_rate": [0.001],
54+
"actor_batch_size": [128],
55+
"batch_size": [64],
56+
"virtual_batch_size": [64],
57+
"unroll_length": [32],
4658
},
4759
]
4860

experiment_code/mrunner_exps/ICLR_baselines/2023_20_09_monk-APPO-T.py

Lines changed: 16 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -22,10 +22,6 @@
2222
"use_resnet": True,
2323
"model": "NetHackNetTtyrec",
2424
"unfreeze_actor_steps": 50_000_000,
25-
"actor_batch_size": 64,
26-
"batch_size": 32,
27-
"virtual_batch_size": 32,
28-
"unroll_length": 80,
2925
}
3026

3127
# params different between exps
@@ -36,10 +32,26 @@
3632
"baseline_cost": [0.5],
3733
"reward_clip": [False],
3834
"adam_learning_rate": [0.0002],
35+
"actor_batch_size": [64],
36+
"batch_size": [32],
37+
"virtual_batch_size": [32],
38+
"unroll_length": [80],
3939
},
4040
{
4141
"seed": list(range(5)),
4242
"adam_learning_rate": [0.001],
43+
"actor_batch_size": [64],
44+
"batch_size": [32],
45+
"virtual_batch_size": [32],
46+
"unroll_length": [80],
47+
},
48+
{
49+
"seed": list(range(5)),
50+
"adam_learning_rate": [0.001],
51+
"actor_batch_size": [128],
52+
"batch_size": [64],
53+
"virtual_batch_size": [64],
54+
"unroll_length": [32],
4355
},
4456
]
4557

0 commit comments

Comments
 (0)