We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 85324a5 commit 59c3cf4 Copy full SHA for 59c3cf4
1 file changed
config/ocean/drmario.ini
@@ -0,0 +1,45 @@
1
+[base]
2
+env_name = drmario
3
+
4
+[vec]
5
+total_agents = 1536
6
+num_buffers = 4
7
+num_threads = 4
8
9
+[env]
10
+n_rows = 16
11
+n_cols = 8
12
+n_init_viruses = 4
13
14
+[policy]
15
+hidden_size = 128
16
+num_layers = 1
17
18
+[legacy]
19
+torch_deterministic = 1
20
+cpu_offload = 0
21
+compile = 1
22
+compile_fullgraph = 0
23
24
+[train]
25
+total_timesteps = 500_000_000
26
+learning_rate = 0.001
27
+gamma = 0.99
28
+gae_lambda = 0.95
29
+clip_coef = 0.2
30
+vf_coef = 0.5
31
+ent_coef = 0.01
32
+minibatch_size = 16384
33
+horizon = 128
34
+use_rnn = 0
35
36
+# Copied from Breakout
37
+beta1 = 0.9
38
+beta2 = 0.999
39
+eps = 1e-8
40
+max_grad_norm = 1.0
41
+replay_ratio = 2
42
+vtrace_rho_clip = 2.0
43
+vtrace_c_clip = 2.0
44
+prio_alpha = 0.6
45
+prio_beta0 = 0.9
0 commit comments