Costa-huang's workspace
Runs
6
Name
6 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
anneal_lr
batch_size
capture_video
clip_coef
clip_vloss
cuda
ent_coef
eval_frequency
eval_levels
exp_name
ext_coef
gae
gae_lambda
gamma
griddly_level
griddly_max_steps
gym_id
int_coef
int_gamma
kle_rollback
kle_stop
learning_rate
max_grad_norm
minibatch_size
n_minibatch
norm_adv
num_envs
num_steps
prod_mode
seed
sticky_action
target_kl
torch_deterministic
total_timesteps
train_levels
update_epochs
update_proportion
vf_coef
video_interval
wandb_entity
wandb_project_name
charts/episode_curiosity_reward
charts/episode_reward
charts/learning_rate
Finished
-
chrisbam4d
1h 54m 39s
-
true
4096
true
0.1
true
true
0.01
10
[1,3]
ppo_rnd_vector_partial
2
true
0.95
0.99
0
128
GDY-Partially-Observable-Zen-Puzzle-v0
1
0.99
false
false
0.00025
0.5
1024
4
true
32
128
true
1
true
0.03
true
10000000
[0,2,4]
4
0.25
0.5
20
chrisbam4d
cleanrl.partial
0.089276
33
1.0242e-7
Finished
-
chrisbam4d
1h 53m 33s
-
true
4096
true
0.1
true
true
0.01
10
[1,3]
ppo_rnd_vector_partial
2
true
0.95
0.99
0
128
GDY-Partially-Observable-Labyrinth-v0
1
0.99
false
false
0.00025
0.5
1024
4
true
32
128
true
1
true
0.03
true
10000000
[0,2,4]
4
0.25
0.5
20
chrisbam4d
cleanrl.partial
0.016503
0
1.0242e-7
Finished
-
chrisbam4d
1h 54m 58s
-
true
4096
true
0.1
true
true
0.01
10
[1,3]
ppo_rnd_vector_partial
2
true
0.95
0.99
0
128
GDY-Partially-Observable-Bait-v0
1
0.99
false
false
0.00025
0.5
1024
4
true
32
128
true
1
true
0.03
true
10000000
[0,2,4]
4
0.25
0.5
20
chrisbam4d
cleanrl.partial
0.030549
7
1.0242e-7
Finished
-
chrisbam4d
2h 43s
-
true
4096
true
0.1
true
true
0.01
10
[1,3]
ppo_rnd_vector_partial
2
true
0.95
0.99
0
128
GDY-Partially-Observable-Clusters-v0
1
0.99
false
false
0.00025
0.5
1024
4
true
32
128
true
1
true
0.03
true
10000000
[0,2,4]
4
0.25
0.5
20
chrisbam4d
cleanrl.partial
0.051763
5
1.0242e-7
Finished
-
chrisbam4d
1h 53m 8s
-
true
4096
true
0.1
true
true
0.01
10
[1,3]
ppo_rnd_vector_partial
2
true
0.95
0.99
0
128
GDY-Partially-Observable-Cook-Me-Pasta-v0
1
0.99
false
false
0.00025
0.5
1024
4
true
32
128
true
1
true
0.03
true
10000000
[0,2,4]
4
0.25
0.5
20
chrisbam4d
cleanrl.partial
0.019928
4
1.0242e-7
Finished
-
chrisbam4d
1h 42m 34s
-
true
4096
true
0.1
true
true
0.01
10
[1,3]
ppo_rnd_vector_partial
2
true
0.95
0.99
0
128
GDY-Partially-Observable-Sokoban---2-v0
1
0.99
false
false
0.00025
0.5
1024
4
true
32
128
true
1
true
0.03
true
10000000
[0,2,4]
4
0.25
0.5
20
chrisbam4d
cleanrl.partial
0.098752
3
1.0242e-7
1-6
of 6