Rickstaa's group workspace
Group: han2020_reproduction_small_actor
Name
75 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
ac_kwargs.activation
ac_kwargs.activation.actor
ac_kwargs.activation.critic
ac_kwargs.hidden_sizes.actor
ac_kwargs.hidden_sizes.critic
ac_kwargs.output_activation
ac_kwargs.output_activation.actor
ac_kwargs.output_activation.critic
actor_critic
adaptive_temperature
alpha
alpha3
batch_size
device
env
env_class
epochs
exp_name
export
gamma
horizon_length
labda
lr_a
lr_a_decay_type
lr_a_final
lr_alpha
lr_alpha_decay_type
lr_alpha_final
lr_c
lr_c_decay_type
lr_c_final
lr_decay_ref
lr_decay_type
lr_labda
lr_labda_decay_type
lr_labda_final
max_ep_len
num_test_episodes
opt_type
polyak
replay_size
save_freq
seed
Finished
-
rickstaa
21m 19s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
0.1
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp0-1
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
234
Finished
-
rickstaa
21m 46s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
0.1
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp0-1
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
78456
Finished
-
rickstaa
21m 47s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
0.3
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp0-3
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
3658
Finished
-
rickstaa
21m 55s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
0.3
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp0-3
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
567
Finished
-
rickstaa
22m 4s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
1
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp1-0
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
48104
Finished
-
rickstaa
22m 8s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
1
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp1-0
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
234
Finished
-
rickstaa
21m 56s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
0.1
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp0-1
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
3658
Finished
-
rickstaa
22m 3s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
0.3
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp0-3
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
78456
Finished
-
rickstaa
22m 9s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
0.1
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp0-1
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
567
Finished
-
rickstaa
21m 55s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
0.1
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp0-1
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
48104
Finished
-
rickstaa
21m 55s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
0.3
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp0-3
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
234
Finished
-
rickstaa
21m 53s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
1
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp1-0
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
3658
Finished
-
rickstaa
22m
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
1
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp1-0
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
78456
Finished
-
rickstaa
21m 54s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
0.3
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp0-3
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
48104
Finished
-
rickstaa
21m 46s
-
-
nn.ReLU
nn.ReLU
[64,64]
[256,256,16]
-
nn.ReLU
-
-
true
2
1
256
gpu:1
Oscillator-v1
stable_gym.envs.biological.oscillator.oscillator.Oscillator
49
han2020_reproduction_lac_oscillator_alpha3_tune_exp_small_actor_alp1-0
false
0.99
5
0.99
0.0001
linear
1.0000e-9
0.0001
linear
1.0000e-9
0.0003
linear
3.0000e-9
step
linear
0.0003
constant
3.0000e-9
400
10
minimize
0.995
1000000
10
567
Finished
-
rickstaa
59m 48s
-
-
nn.ReLU
nn.ReLU
[64,64]
[64,64,16]
-
nn.ReLU
-
-
true
2
0.3
256
gpu:1
FetchReachCost-v1
stable_gym.envs.robotics.fetch.fetch_reach_cost.fetch_reach_cost.FetchReachCost
147
han2020_reproduction_lac_fetch_reach_alpha3_tune_infinite_horizon_exp_small_actor_alp0-3
false
0.995
0
0.99
0.0001
linear
3.3333e-10
0.0001
linear
3.3333e-10
0.0003
linear
1.0000e-9
step
linear
0.0003
constant
1.0000e-9
200
10
minimize
0.995
1000000
10
234
Finished
-
rickstaa
59m 32s
-
-
nn.ReLU
nn.ReLU
[64,64]
[64,64,16]
-
nn.ReLU
-
-
true
2
0.1
256
gpu:1
FetchReachCost-v1
stable_gym.envs.robotics.fetch.fetch_reach_cost.fetch_reach_cost.FetchReachCost
147
han2020_reproduction_lac_fetch_reach_alpha3_tune_infinite_horizon_exp_small_actor_alp0-1
false
0.995
0
0.99
0.0001
linear
3.3333e-10
0.0001
linear
3.3333e-10
0.0003
linear
1.0000e-9
step
linear
0.0003
constant
1.0000e-9
200
10
minimize
0.995
1000000
10
3658
Finished
-
rickstaa
59m 48s
-
-
nn.ReLU
nn.ReLU
[64,64]
[64,64,16]
-
nn.ReLU
-
-
true
2
1
256
gpu:1
FetchReachCost-v1
stable_gym.envs.robotics.fetch.fetch_reach_cost.fetch_reach_cost.FetchReachCost
147
han2020_reproduction_lac_fetch_reach_alpha3_tune_infinite_horizon_exp_small_actor_alp1-0
false
0.995
0
0.99
0.0001
linear
3.3333e-10
0.0001
linear
3.3333e-10
0.0003
linear
1.0000e-9
step
linear
0.0003
constant
1.0000e-9
200
10
minimize
0.995
1000000
10
78456
Finished
-
rickstaa
59m 35s
-
-
nn.ReLU
nn.ReLU
[64,64]
[64,64,16]
-
nn.ReLU
-
-
true
2
0.3
256
gpu:1
FetchReachCost-v1
stable_gym.envs.robotics.fetch.fetch_reach_cost.fetch_reach_cost.FetchReachCost
147
han2020_reproduction_lac_fetch_reach_alpha3_tune_infinite_horizon_exp_small_actor_alp0-3
false
0.995
0
0.99
0.0001
linear
3.3333e-10
0.0001
linear
3.3333e-10
0.0003
linear
1.0000e-9
step
linear
0.0003
constant
1.0000e-9
200
10
minimize
0.995
1000000
10
48104
Finished
-
rickstaa
59m 40s
-
-
nn.ReLU
nn.ReLU
[64,64]
[64,64,16]
-
nn.ReLU
-
-
true
2
0.3
256
gpu:1
FetchReachCost-v1
stable_gym.envs.robotics.fetch.fetch_reach_cost.fetch_reach_cost.FetchReachCost
147
han2020_reproduction_lac_fetch_reach_alpha3_tune_infinite_horizon_exp_small_actor_alp0-3
false
0.995
0
0.99
0.0001
linear
3.3333e-10
0.0001
linear
3.3333e-10
0.0003
linear
1.0000e-9
step
linear
0.0003
constant
1.0000e-9
200
10
minimize
0.995
1000000
10
567
1-20
of 75