Clabornd's group workspace
Group: train_2023-07-08_23-06-44
Name
0 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
actor_lr
batch_size
buffer_size
critic_lr
epochs
eps
explore_0
explore_decay
gamma
lam
min_explore
run_id
samples_per_epoch
trial_log_path
wandb.project
epoch_avg_rew
Finished
-
clabornd
1h 2m 47s
-
0.00066187
256
50000
0.0008655
100
0.17301
0.95
0.95
0.98185
0.6525
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00015_15_actor_lr=0.0007,critic_lr=0.0009,eps=0.1730,gamma=0.9818,lam=0.6525_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 39s
-
0.00090197
256
50000
0.00073883
100
0.17164
0.95
0.95
0.99147
0.60314
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00014_14_actor_lr=0.0009,critic_lr=0.0007,eps=0.1716,gamma=0.9915,lam=0.6031_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 3m 42s
-
0.00089136
256
50000
0.00055754
100
0.24607
0.95
0.95
0.98986
0.65038
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00013_13_actor_lr=0.0009,critic_lr=0.0006,eps=0.2461,gamma=0.9899,lam=0.6504_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 3m 37s
-
0.0006396
256
50000
0.00088588
100
0.063693
0.95
0.95
0.98812
0.5003
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00012_12_actor_lr=0.0006,critic_lr=0.0009,eps=0.0637,gamma=0.9881,lam=0.5003_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 4m 15s
-
0.00089902
256
50000
0.00071665
100
0.077951
0.95
0.95
0.99498
0.58277
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00011_11_actor_lr=0.0009,critic_lr=0.0007,eps=0.0780,gamma=0.9950,lam=0.5828_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 4m 50s
-
0.00084544
256
50000
0.00067608
100
0.18227
0.95
0.95
0.99776
0.85566
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00010_10_actor_lr=0.0008,critic_lr=0.0007,eps=0.1823,gamma=0.9978,lam=0.8557_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 4m 30s
-
0.00069503
256
50000
0.00093445
100
0.2128
0.95
0.95
0.98952
0.61214
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00009_9_actor_lr=0.0007,critic_lr=0.0009,eps=0.2128,gamma=0.9895,lam=0.6121_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 4m 44s
-
0.00086112
256
50000
0.00057965
100
0.23581
0.95
0.95
0.99838
0.72031
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00008_8_actor_lr=0.0009,critic_lr=0.0006,eps=0.2358,gamma=0.9984,lam=0.7203_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 4m 10s
-
0.00070047
256
50000
0.00055504
100
0.1198
0.95
0.95
0.98038
0.56701
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00007_7_actor_lr=0.0007,critic_lr=0.0006,eps=0.1198,gamma=0.9804,lam=0.5670_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 5m 19s
-
0.00071495
256
50000
0.00076181
100
0.20831
0.95
0.95
0.98601
0.8999
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00006_6_actor_lr=0.0007,critic_lr=0.0008,eps=0.2083,gamma=0.9860,lam=0.8999_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 4m 16s
-
0.00095961
256
50000
0.00086085
100
0.091617
0.95
0.95
0.98722
0.59195
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00005_5_actor_lr=0.0010,critic_lr=0.0009,eps=0.0916,gamma=0.9872,lam=0.5920_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 5m 2s
-
0.0006308
256
50000
0.00072621
100
0.2048
0.95
0.95
0.99494
0.80734
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00004_4_actor_lr=0.0006,critic_lr=0.0007,eps=0.2048,gamma=0.9949,lam=0.8073_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 4m 58s
-
0.00096017
256
50000
0.0007578
100
0.14541
0.95
0.95
0.98259
0.9212
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00003_3_actor_lr=0.0010,critic_lr=0.0008,eps=0.1454,gamma=0.9826,lam=0.9212_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 4m 5s
-
0.00092202
256
50000
0.00088797
100
0.11444
0.95
0.95
0.99333
0.53544
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00000_0_actor_lr=0.0009,critic_lr=0.0009,eps=0.1144,gamma=0.9933,lam=0.5354_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 3m 35s
-
0.00054126
256
50000
0.0009489
100
0.1054
0.95
0.95
0.9858
0.63097
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00002_2_actor_lr=0.0005,critic_lr=0.0009,eps=0.1054,gamma=0.9858,lam=0.6310_2023-07-08_23-06-44
ppo-basic
-
Finished
-
clabornd
1h 4m 52s
-
0.00075278
256
50000
0.00054904
100
0.096999
0.95
0.95
0.98382
0.92676
0.05
-
10000
/root/ray_results/train_2023-07-08_23-06-44/train_1b373_00001_1_actor_lr=0.0008,critic_lr=0.0005,eps=0.0970,gamma=0.9838,lam=0.9268_2023-07-08_23-06-44
ppo-basic
-
1-16
of 16