Bragajj's workspace
Runs
27
Name
27 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
anneal_lr
batch_size
buffer_size
capture_video
clip_coef
clip_vloss
cuda
end_e
ent_coef
env_id
exp_name
exploration_fraction
gae
gae_lambda
gamma
learning_rate
learning_starts
max_grad_norm
minibatch_size
norm_adv
num_envs
num_minibatches
num_steps
seed
start_e
target_network_frequency
torch_deterministic
total_timesteps
track
train_frequency
update_epochs
vf_coef
wandb_entity
wandb_project_name
charts/SPS
charts/episodic_length
charts/episodic_return
charts/epsilon
charts/learning_rate
global_step
losses/approx_kl
losses/clipfrac
losses/entropy
losses/explained_variance
Finished
-
costa-huang
3m 10s
-
-
128
10000
true
-
-
false
0.05
-
Acrobot-v1
dqn
0.5
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
3
1
500
true
500000
true
10
-
-
cleanrl
benchmark
2816
-
-83
0.05
-
499960
-
-
-
-
Finished
-
costa-huang
2m 39s
-
-
128
10000
true
-
-
false
0.05
-
MountainCar-v0
dqn
0.5
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
3
1
500
true
500000
true
10
-
-
cleanrl
benchmark
3428
-
-152
0.05
-
499939
-
-
-
-
Finished
-
costa-huang
3m 14s
-
-
128
10000
true
-
-
false
0.05
-
Acrobot-v1
dqn
0.5
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
2
1
500
true
500000
true
10
-
-
cleanrl
benchmark
2758
-
-100
0.05
-
499992
-
-
-
-
Finished
-
costa-huang
2m 38s
-
-
128
10000
true
-
-
false
0.05
-
MountainCar-v0
dqn
0.5
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
2
1
500
true
500000
true
10
-
-
cleanrl
benchmark
3458
-
-200
0.05
-
499900
-
-
-
-
Finished
-
costa-huang
2m 39s
-
-
128
10000
true
-
-
false
0.05
-
MountainCar-v0
dqn
0.5
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
1
1
500
true
500000
true
10
-
-
cleanrl
benchmark
3441
-
-200
0.05
-
499905
-
-
-
-
Finished
-
costa-huang
3m 17s
-
-
128
10000
true
-
-
false
0.05
-
Acrobot-v1
dqn
0.5
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
1
1
500
true
500000
true
10
-
-
cleanrl
benchmark
2730
-
-75
0.05
-
499961
-
-
-
-
Finished
-
costa-huang
2m 19s
-
-
128
10000
true
-
-
false
0.05
-
CartPole-v1
dqn
0.5
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
3
1
500
true
500000
true
10
-
-
cleanrl
benchmark
3966
-
500
0.05
-
499900
-
-
-
-
Finished
-
costa-huang
2m 18s
-
-
128
10000
true
-
-
false
0.05
-
CartPole-v1
dqn
0.5
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
2
1
500
true
500000
true
10
-
-
cleanrl
benchmark
3982
-
385
0.05
-
499900
-
-
-
-
Finished
-
costa-huang
2m 20s
-
-
128
10000
true
-
-
false
0.05
-
CartPole-v1
dqn
0.5
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
1
1
500
true
500000
true
10
-
-
cleanrl
benchmark
3920
-
500
0.05
-
499900
-
-
-
-
Finished
-
costa-huang
2m 16s
-
-
128
10000
true
-
-
false
0.05
-
CartPole-v1
dqn
0.8
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
1
1
500
true
500000
true
10
-
-
cleanrl
benchmark
4043
-
500
0.05
-
499900
-
-
-
-
Finished
-
costa-huang
8s
-
-
32
10000
true
-
-
false
0.05
-
MountainCar-v0
dqn
0.8
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
3
1
500
true
500000
true
1
-
-
cleanrl
benchmark
-
-
-
-
-
-
-
-
-
-
Finished
-
costa-huang
4s
-
-
32
10000
true
-
-
false
0.05
-
CartPole-v1
dqn
0.8
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
3
1
500
true
500000
true
1
-
-
cleanrl
benchmark
-
-
-
-
-
-
-
-
-
-
Finished
-
costa-huang
10s
-
-
32
10000
true
-
-
false
0.05
-
MountainCar-v0
dqn
0.8
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
2
1
500
true
500000
true
1
-
-
cleanrl
benchmark
-
-
-
-
-
-
-
-
-
-
Killed
-
costa-huang
17s
-
-
32
10000
true
-
-
false
0.05
-
Acrobot-v1
dqn
0.8
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
2
1
500
true
500000
true
1
-
-
cleanrl
benchmark
-
-
-500
0.99763
-
999
-
-
-
-
Finished
-
costa-huang
34s
-
-
32
10000
true
-
-
false
0.05
-
CartPole-v1
dqn
0.8
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
2
1
500
true
25000
true
1
-
-
cleanrl
benchmark
1173
-
179
0.05
-
24909
-
-
-
-
Finished
-
costa-huang
36s
-
-
32
10000
true
-
-
false
0.05
-
MountainCar-v0
dqn
0.8
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
1
1
500
true
25000
true
1
-
-
cleanrl
benchmark
1095
-
-200
0.05
-
24999
-
-
-
-
Finished
-
costa-huang
40s
-
-
32
10000
true
-
-
false
0.05
-
Acrobot-v1
dqn
0.8
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
1
1
500
true
25000
true
1
-
-
cleanrl
benchmark
918
-
-263
0.05
-
24900
-
-
-
-
Finished
-
costa-huang
34s
-
-
32
10000
true
-
-
false
0.05
-
CartPole-v1
dqn
0.8
-
-
0.99
0.00025
10000
0.5
-
-
-
-
-
1
1
500
true
25000
true
1
-
-
cleanrl
benchmark
1224
-
228
0.05
-
24900
-
-
-
-
Finished
-
costa-huang
3m 25s
-
true
512
-
true
0.2
true
false
-
0.01
Acrobot-v1
ppo
-
true
0.95
0.99
0.00025
-
0.5
128
true
4
4
128
3
-
-
true
500000
true
-
4
0.5
cleanrl
benchmark
2596
80
-79
-
2.5615e-7
499712
0
0
0.13535
0.93773
Finished
-
costa-huang
2m 30s
-
true
512
-
true
0.2
true
false
-
0.01
MountainCar-v0
ppo
-
true
0.95
0.99
0.00025
-
0.5
128
true
4
4
128
3
-
-
true
500000
true
-
4
0.5
cleanrl
benchmark
3637
200
-200
-
2.5615e-7
499712
9.3132e-9
0
1.01912
-0.000074744
1-20
of 27