File tree Expand file tree Collapse file tree 9 files changed +879
-114
lines changed Expand file tree Collapse file tree 9 files changed +879
-114
lines changed Original file line number Diff line number Diff line change 1
1
[base]
2
2
package = nethack
3
3
env_name = nethack
4
+ policy_name = Policy
5
+ rnn_name = Recurrent
4
6
5
7
[vec]
6
- num_envs = 128
8
+ num_envs = 8192
7
9
num_workers = 16
8
- batch_size = 64
10
+ batch_size = 4096
9
11
10
12
[train]
11
- batch_size = 8192
12
- minibatch_size = 2048
13
- update_epochs = 1
13
+ total_timesteps = 90_000_000
14
+ adam_beta1 = 0.8946507418260217
15
+ adam_beta2 = 0.9
16
+ adam_eps = 0.0001
17
+ batch_size = auto
14
18
bptt_horizon = 64
15
- total_timesteps = 10_000_000
16
- anneal_lr = False
19
+ clip_coef = 0.19696765958267629
20
+ ent_coef = 0.0005690816545012474
21
+ gae_lambda = 0.747650023961198
22
+ gamma = 0.9997053654668936
23
+ learning_rate = 0.044482546441415506
24
+ max_grad_norm = 2.2356112188495723
25
+ minibatch_size = 32768
26
+ prio_alpha = 0.98967001208896
27
+ prio_beta0 = 0.09999999999999998
28
+ vf_clip_coef = 2.178492167689251
29
+ vf_coef = 1.6832989594296321
30
+ vtrace_c_clip = 2.878171091654008
31
+ vtrace_rho_clip = 0.7876748061547312
Original file line number Diff line number Diff line change @@ -10,31 +10,32 @@ num_envs = 8
10
10
[env]
11
11
num_envs = 1024
12
12
frameskip = 4
13
- width = 1920
14
- height = 1080
15
- track_width = 50
13
+ width = 1080
14
+ height = 720
15
+ track_width = 75
16
16
num_radial_sectors = 180
17
17
num_points = 16
18
18
bezier_resolution = 4
19
19
turn_pi_frac = 40
20
- w_ang = 0.586 # 0.523
20
+ w_ang = 0.777 # 0.586 # 0.523
21
21
reward_yellow = 0.2
22
22
reward_green = -0.001
23
23
corner_thresh = 0.5 # dot product for hairpins
24
24
ftmp1 = 0.5 # 0.9
25
25
ftmp2 = 3.0 # 1.05
26
26
ftmp3 = 0.3 # 0.2
27
27
ftmp4 = 0.0
28
- render_many = 1
28
+ mode7 = 0
29
+ render_many = 0
29
30
rng = 6
30
- method = -1
31
+ method = 2
31
32
32
33
[policy]
33
- hidden_size = 64
34
+ hidden_size = 128
34
35
35
36
[rnn]
36
- input_size = 64
37
- hidden_size = 64
37
+ input_size = 128
38
+ hidden_size = 128
38
39
39
40
[train]
40
41
adam_beta1 = 0.9446160612709289
@@ -53,7 +54,7 @@ max_grad_norm = 1.1402446026380597
53
54
minibatch_size = 32768 # 16384 32768
54
55
prio_alpha = 0.8186786991771018
55
56
prio_beta0 = 0.49639773186725333
56
- total_timesteps = 20_000_000
57
+ total_timesteps = 200_000_000
57
58
vf_clip_coef = 1.1492700894337171
58
59
vf_coef = 1.2551354745222134
59
60
vtrace_c_clip = 0
You can’t perform that action at this time.
0 commit comments