Scottemmons's workspace
Runs
135
Name
30 visualized
env: antmaze-medium-diverse-v2
env: antmaze-medium-diverse-v2
5
env: antmaze-medium-play-v2
env: antmaze-medium-play-v2
5
env: antmaze-umaze-diverse-v2
env: antmaze-umaze-diverse-v2
5
env: antmaze-umaze-v2
env: antmaze-umaze-v2
5
env: antmaze-large-diverse-v2
env: antmaze-large-diverse-v2
5
env: antmaze-large-play-v2
env: antmaze-large-play-v2
5
State
Notes
User
Tags
Created
Runtime
Sweep
batch_size
cql.alpha_multiplier
cql.backup_entropy
cql.cql_importance_sample
cql.cql_lagrange
cql.cql_min_q_weight
cql.cql_n_actions
cql.cql_target_action_gap
cql.cql_temp
cql.discount
cql.optimizer_type
cql.policy_lr
cql.qf_lr
cql.reward_scale
cql.soft_target_update_rate
cql.target_entropy
cql.target_update_period
cql.use_automatic_entropy_tuning
cql.use_cql
device
env
eval_n_trajs
eval_period
hostname
logging.online
logging.output_dir
logging.prefix
logging.project
logging.random_delay
max_traj_length
n_epochs
n_train_step_per_epoch
policy_arch
policy_log_std_multiplier
policy_log_std_offset
qf_arch
replay_buffer_size
save_model
seed
average_normalizd_return
average_return
average_traj_length
epoch
epoch_time
Finished
-
scottemmons
1d 14m 34s
-
256
1
false
true
true
5
10
5
1
0.99
adam
0.0001
0.0003
1
0.005
0
1
true
true
cuda
antmaze-medium-diverse-v2
100
100
["n0175.savio3","n0176.savio3"]
true
./experiment_output
SimpleSAC
cql
0
1000
2000
1000
256-256-256
1
-1
256-256-256
1000000
false
2
0
0
1000
1999
337.90225
Finished
-
scottemmons
1d 9m 53s
-
256
1
false
true
true
5
10
5
1
0.99
adam
0.0001
0.0003
1
0.005
0
1
true
true
cuda
antmaze-medium-play-v2
100
100
["n0175.savio3","n0176.savio3"]
true
./experiment_output
SimpleSAC
cql
0
1000
2000
1000
256-256-256
1
-1
256-256-256
1000000
false
2
0
0
1000
1999
390.5344
Finished
-
scottemmons
22h 50m 39s
-
256
1
false
true
true
5
10
5
1
0.99
adam
0.0001
0.0003
1
0.005
0
1
true
true
cuda
antmaze-umaze-diverse-v2
100
100
["n0175.savio3","n0176.savio3"]
true
./experiment_output
SimpleSAC
cql
0
700
2000
1000
256-256-256
1
-1
256-256-256
1000000
false
2
0.48
0.48
509.814
1999
330.96559
Finished
-
scottemmons
22h 42m 14s
-
256
1
false
true
true
5
10
5
1
0.99
adam
0.0001
0.0003
1
0.005
0
1
true
true
cuda
antmaze-umaze-v2
100
100
["n0175.savio3","n0176.savio3"]
true
./experiment_output
SimpleSAC
cql
0
700
2000
1000
256-256-256
1
-1
256-256-256
1000000
false
2
0.254
0.254
585.404
1999
303.76952
Finished
-
scottemmons
1d 2h 28m 53s
-
256
1
false
true
true
5
10
5
1
0.99
adam
0.0001
0.0003
1
0.005
0
1
true
true
cuda
antmaze-large-diverse-v2
100
100
n0176.savio3
true
./experiment_output
SimpleSAC
cql
0
1000
2000
1000
256-256-256
1
-1
256-256-256
1000000
false
2
0
0
1000
1999
292.74242
Finished
-
scottemmons
1d 2h 48m 10s
-
256
1
false
true
true
5
10
5
1
0.99
adam
0.0001
0.0003
1
0.005
0
1
true
true
cuda
antmaze-large-play-v2
100
100
n0176.savio3
true
./experiment_output
SimpleSAC
cql
0
1000
2000
1000
256-256-256
1
-1
256-256-256
1000000
false
2
0
0
1000
1999
319.56179
1-6
of 6