Costa-huang's workspace
Runs
215
Name
0 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
alpha
autotune
batch_size
buffer_size
capture_video
cuda
end_e
env_id
exp_name
exploration_fraction
exploration_noise
gamma
learning_rate
learning_starts
max_grad_norm
n_atoms
noise_clip
policy_frequency
policy_lr
policy_noise
q_lr
seed
start_e
target_network_frequency
tau
torch_deterministic
total_timesteps
track
train_frequency
v_max
v_min
wandb_entity
wandb_project_name
adv_norm_fullbatch
alg
anneal_lr
aux_batch_rollouts
beta_clone
clip_coef
clip_vloss
e_auxiliary
e_policy
ent_coef
env
Finished
-
dosssman
2h 17m 1s
-
-
-
256
1000000
true
true
-
Walker2d-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
1
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
2h 16m 27s
-
-
-
256
1000000
true
true
-
HalfCheetah-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
3
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
2h 15m 52s
-
-
-
256
1000000
true
true
-
HalfCheetah-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
1
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
2h 15m 4s
-
-
-
256
1000000
true
true
-
Walker2d-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
2
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
2h 16m 19s
-
-
-
256
1000000
true
true
-
Hopper-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
1
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
2h 16m 15s
-
-
-
256
1000000
true
true
-
Walker2d-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
3
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
2h 17m 29s
-
-
-
256
1000000
true
true
-
HalfCheetah-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
2
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
2h 15m 26s
-
-
-
256
1000000
true
true
-
Hopper-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
3
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
2h 15m 9s
-
-
-
256
1000000
true
true
-
Hopper-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
2
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
3h 34s
-
-
-
256
1000000
true
true
-
Pusher-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
1
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
3h 4s
-
-
-
256
1000000
true
true
-
Pusher-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
2
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
2h 57m 14s
-
-
-
256
1000000
true
true
-
Pusher-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
3
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
2h 46m 46s
-
-
-
256
1000000
true
true
-
InvertedPendulum-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
2
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
2h 49m 32s
-
-
-
256
1000000
true
true
-
InvertedPendulum-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
1
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
2h 50m 14s
-
-
-
256
1000000
true
true
-
InvertedPendulum-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
3
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
6h 56m 47s
-
-
-
256
1000000
true
true
-
Humanoid-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
1
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
6h 57m 53s
-
-
-
256
1000000
true
true
-
Humanoid-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
3
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
Finished
-
dosssman
6h 57m 13s
-
-
-
256
1000000
true
true
-
Humanoid-v2
ddpg_continuous_action
-
0.1
0.99
0.0003
25000
-
-
0.5
2
-
-
-
2
-
-
0.005
true
1000000
true
-
-
-
openrlbenchmark
cleanrl
-
-
-
-
-
-
-
-
-
-
-
1-18
of 18