Colinli's workspace
Runs
39
Name
2 visualized
env_name: cartpole-swingup_sparse
env_name: cartpole-swingup_sparse
2
env_name: hopper-stand
env_name: hopper-stand
5
env_name: humanoid-stand
env_name: humanoid-stand
8
env_name: hopper-hop
env_name: hopper-hop
8
env_name: humanoid-run
env_name: humanoid-run
8
env_name: fish-swim
env_name: fish-swim
8
State
Notes
User
Tags
Created
Runtime
Sweep
?
alsologtostderr
batch_size
brief_logging
chex_assert_multiple_cpu_devices
chex_n_cpu_devices
chex_skip_pmap_variant_if_single_device
collect_heldout_rb
config0
config1
config2
config3
config4
env_name
eval_episodes
eval_interval
gaussian_exploration_noise
hbm_oom_exit
heldout_evaluation_trunk_size
heldout_interval
help
helpfull
helpshort
helpxml
log_dir
log_interval
logtostderr
max_steps
mode_action
only_check_args
op_conversion_fallback_to_while_loop
pdb
pdb_post_mortem
project_name
run_with_pdb
run_with_profiling
runtime_oom_exit
save_dir
save_replay_buffer
seed
showprefixforinfo
start_training
stderrthreshold
test_random_seed
Crashed
-
colinli
25m 17s
-
false
false
256
true
false
1
true
true
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: reg-
proper_weight_decay: false
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.01
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: do01-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.03
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: do03-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.01
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: wd01-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.003
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: wd003-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
cartpole-swingup_sparse
10
5000
0
true
2048
10
false
false
false
false
1000
false
1000000
false
false
true
false
false
RR-09-21-multiple
false
false
true
save_dir
false
1.5
true
10000
fatal
301
Crashed
-
colinli
3h 28m 45s
-
false
false
256
true
false
1
true
true
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: reg-
proper_weight_decay: false
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.01
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: do01-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.03
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: do03-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.01
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: wd01-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.003
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: wd003-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
hopper-stand
10
5000
0
true
2048
10
false
false
false
false
1000
false
1000000
false
false
true
false
false
RR-09-21-multiple
false
false
true
save_dir
false
4
true
10000
fatal
301
Crashed
-
colinli
16h 18m 36s
-
false
false
256
true
false
1
true
true
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: reg-
proper_weight_decay: false
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.01
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: do01-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.03
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: do03-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.01
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: wd01-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.003
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: wd003-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
humanoid-stand
10
5000
0
true
2048
10
false
false
false
false
1000
false
1000000
false
false
true
false
false
RR-09-21-multiple
false
false
true
save_dir
false
3.5
true
10000
fatal
301
Crashed
-
colinli
17h 37m 21s
-
false
false
256
true
false
1
true
true
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: reg-
proper_weight_decay: false
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.01
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: do01-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.03
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: do03-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.01
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: wd01-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.003
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: wd003-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
hopper-hop
10
5000
0
true
2048
10
false
false
false
false
1000
false
1000000
false
false
true
false
false
RR-09-21-multiple
false
false
true
save_dir
false
3.5
true
10000
fatal
301
Finished
-
colinli
18h 53m 58s
-
false
false
256
true
false
1
true
true
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: reg-
proper_weight_decay: false
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.01
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: do01-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.03
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: do03-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.01
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: wd01-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.003
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: wd003-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
humanoid-run
10
5000
0
true
2048
10
false
false
false
false
1000
false
1000000
false
false
true
false
false
RR-09-21-multiple
false
false
true
save_dir
false
3.5
true
10000
fatal
301
Finished
-
colinli
17h 45m 34s
-
false
false
256
true
false
1
true
true
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: reg-
proper_weight_decay: false
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.01
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: do01-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.03
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.0
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: do03-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.01
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: wd01-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
actor_lr: 0.0003
actor_type: tanh_normal
actor_weight_decay: 0.0
actor_weight_noise: 0.0
critic_cql_coeff: 0.0
critic_dropout_rate: 0.0
critic_feature_norm: false
critic_feature_reg_coeff: 0.0
critic_last_layer_weight_decay: 0.0
critic_layer_norm: true
critic_lr: 0.0003
critic_reduction_mode: min
critic_spectral_norm: false
critic_std_coeff: 0.0
critic_std_location: none
critic_use_acme_arch: false
critic_weight_decay: 0.003
critic_weight_decay_on_bias: false
critic_weight_decay_to_init: false
critic_weight_noise: 0.0
discount: 0.99
feature_ot_coeff: 0.0
hidden_dims: !!python/tuple
- 256
- 256
init_temperature: 1.0
model_cls: SACLearner
num_qs: 2
orthogonal_mlp: false
prefix: wd003-
proper_weight_decay: true
proper_weight_decay_not_first: false
sampled_actor_update: true
sampled_backup: true
target_entropy: null
tau: 0.005
temp_lr: 0.0003
fish-swim
10
5000
0
true
2048
10
false
false
false
false
1000
false
1000000
false
false
true
false
false
RR-09-21-multiple
false
false
true
save_dir
false
3.5
true
10000
fatal
301
1-6
of 6