We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent c21d78b · commit 026119d · Copy full SHA for 026119d
1 file changed
pufferlib/config/ocean/g2048.ini
@@ -46,6 +46,20 @@ vtrace_rho_clip = 1.6
46
metric = score
47
goal = maximize
48
49
+[sweep.train.total_timesteps]
50
+distribution = log_normal
51
+min = 3e8
52
+max = 1e10
53
+mean = 1e9
54
+scale = time
55
+
56
+[sweep.train.learning_rate]
57
+distribution = log_normal
58
+min = 0.00001
59
+mean = 0.001
60
+max = 0.1
61
+scale = 0.5
62
+
63
[sweep.train.gae_lambda]
64
distribution = logit_normal
65
min = 0.01
0 commit comments