File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 22env_name = drmario
33
44[vec]
5- total_agents = 1536
5+ total_agents = 8192
66num_buffers = 4
77num_threads = 4
88
@@ -11,35 +11,5 @@ n_rows = 16
1111n_cols = 8
1212n_init_viruses = 4
1313
14- [policy]
15- hidden_size = 128
16- num_layers = 1
17-
18- [legacy]
19- torch_deterministic = 1
20- cpu_offload = 0
21- compile = 1
22- compile_fullgraph = 0
23-
2414[train]
25- total_timesteps = 500_000_000
26- learning_rate = 0.001
27- gamma = 0.99
28- gae_lambda = 0.95
29- clip_coef = 0.2
30- vf_coef = 0.5
31- ent_coef = 0.01
32- minibatch_size = 16384
33- horizon = 128
34- use_rnn = 0
35-
36- # copied from Breakout
37- beta1 = 0.9
38- beta2 = 0.999
39- eps = 1e-8
40- max_grad_norm = 1.0
41- replay_ratio = 2
42- vtrace_rho_clip = 2.0
43- vtrace_c_clip = 2.0
44- prio_alpha = 0.6
45- prio_beta0 = 0.9
15+ total_timesteps = 200_000_000
Original file line number Diff line number Diff line change 11#include "drmario.h"
22
3- #define OBS_SIZE 133
3+ #define OBS_SIZE 394
44#define NUM_ATNS 1
55#define ACT_SIZES {7}
66#define OBS_TENSOR_T FloatTensor
You can’t perform that action at this time.
0 commit comments