Clabornd's group workspace
Group: train_2023-07-13_05-28-51
Name
0 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
actor_lr
batch_size
buffer_size
critic_lr
epochs
eps
explore_0
explore_decay
gamma
lam
min_explore
run_id
samples_per_epoch
trial_log_path
wandb.project
epoch_avg_rew
Finished
-
clabornd
55m 43s
-
0.00065
256
20000
0.0007
100
0.11808
0.95
0.95
0.98406
0.93518
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00031_31_buffer_size=20000,eps=0.1181,gamma=0.9841,lam=0.9352_2023-07-13_08-24-02
ppo-basic
-
Finished
-
clabornd
59m 51s
-
0.00065
256
10000
0.0007
100
0.11831
0.95
0.95
0.98719
0.9173
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00030_30_buffer_size=10000,eps=0.1183,gamma=0.9872,lam=0.9173_2023-07-13_08-20-12
ppo-basic
-
Finished
-
clabornd
1h 1m 36s
-
0.00065
256
20000
0.0007
100
0.17912
0.95
0.95
0.9829
0.99443
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00029_29_buffer_size=20000,eps=0.1791,gamma=0.9829,lam=0.9944_2023-07-13_08-18-55
ppo-basic
-
Finished
-
clabornd
1h 58s
-
0.00065
256
10000
0.0007
100
0.13245
0.95
0.95
0.99817
0.96013
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00028_28_buffer_size=10000,eps=0.1325,gamma=0.9982,lam=0.9601_2023-07-13_08-18-04
ppo-basic
-
Finished
-
clabornd
59m 30s
-
0.00065
256
20000
0.0007
100
0.14561
0.95
0.95
0.99967
0.91065
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00027_27_buffer_size=20000,eps=0.1456,gamma=0.9997,lam=0.9106_2023-07-13_07-26-27
ppo-basic
-
Finished
-
clabornd
57m 9s
-
0.00065
256
10000
0.0007
100
0.1822
0.95
0.95
0.99057
0.9356
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00026_26_buffer_size=10000,eps=0.1822,gamma=0.9906,lam=0.9356_2023-07-13_07-23-24
ppo-basic
-
Finished
-
clabornd
58m 48s
-
0.00065
256
20000
0.0007
100
0.19651
0.95
0.95
0.99169
0.92188
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00025_25_buffer_size=20000,eps=0.1965,gamma=0.9917,lam=0.9219_2023-07-13_07-23-03
ppo-basic
-
Finished
-
clabornd
57m 18s
-
0.00065
256
10000
0.0007
100
0.1977
0.95
0.95
0.98568
0.97065
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00024_24_buffer_size=10000,eps=0.1977,gamma=0.9857,lam=0.9707_2023-07-13_07-22-23
ppo-basic
-
Finished
-
clabornd
58m 55s
-
0.00065
256
20000
0.0007
100
0.10908
0.95
0.95
0.99211
0.93653
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00023_23_buffer_size=20000,eps=0.1091,gamma=0.9921,lam=0.9365_2023-07-13_06-27-13
ppo-basic
-
Finished
-
clabornd
56m 26s
-
0.00065
256
10000
0.0007
100
0.1598
0.95
0.95
0.98217
0.99231
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00022_22_buffer_size=10000,eps=0.1598,gamma=0.9822,lam=0.9923_2023-07-13_06-27-01
ppo-basic
-
Finished
-
clabornd
58m 26s
-
0.00065
256
20000
0.0007
100
0.11627
0.95
0.95
0.99893
0.93262
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00021_21_buffer_size=20000,eps=0.1163,gamma=0.9989,lam=0.9326_2023-07-13_06-25-26
ppo-basic
-
Finished
-
clabornd
57m 7s
-
0.00065
256
10000
0.0007
100
0.10075
0.95
0.95
0.98913
0.9922
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00020_20_buffer_size=10000,eps=0.1008,gamma=0.9891,lam=0.9922_2023-07-13_06-25-23
ppo-basic
-
Finished
-
clabornd
59m 48s
-
0.00065
256
20000
0.0007
100
0.1911
0.95
0.95
0.98447
0.96739
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00019_19_buffer_size=20000,eps=0.1911,gamma=0.9845,lam=0.9674_2023-07-13_05-29-01
ppo-basic
-
Finished
-
clabornd
57m 30s
-
0.00065
256
10000
0.0007
100
0.11604
0.95
0.95
0.98231
0.97284
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00018_18_buffer_size=10000,eps=0.1160,gamma=0.9823,lam=0.9728_2023-07-13_05-29-01
ppo-basic
-
Finished
-
clabornd
59m
-
0.00065
256
20000
0.0007
100
0.16744
0.95
0.95
0.9842
0.91385
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00017_17_buffer_size=20000,eps=0.1674,gamma=0.9842,lam=0.9139_2023-07-13_05-29-00
ppo-basic
-
Finished
-
clabornd
57m 19s
-
0.00065
256
10000
0.0007
100
0.13543
0.95
0.95
0.99761
0.92766
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00016_16_buffer_size=10000,eps=0.1354,gamma=0.9976,lam=0.9277_2023-07-13_05-29-00
ppo-basic
-
Finished
-
clabornd
59m 39s
-
0.00065
256
20000
0.0007
100
0.13386
0.95
0.95
0.98171
0.95952
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00015_15_buffer_size=20000,eps=0.1339,gamma=0.9817,lam=0.9595_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
56m 20s
-
0.00065
256
10000
0.0007
100
0.11414
0.95
0.95
0.99161
0.97532
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00014_14_buffer_size=10000,eps=0.1141,gamma=0.9916,lam=0.9753_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
58m 52s
-
0.00065
256
20000
0.0007
100
0.15095
0.95
0.95
0.98077
0.92136
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00013_13_buffer_size=20000,eps=0.1510,gamma=0.9808,lam=0.9214_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
56m 58s
-
0.00065
256
10000
0.0007
100
0.19203
0.95
0.95
0.99694
0.97774
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00012_12_buffer_size=10000,eps=0.1920,gamma=0.9969,lam=0.9777_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
57m 36s
-
0.00065
256
20000
0.0007
100
0.11899
0.95
0.95
0.99047
0.92019
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00011_11_buffer_size=20000,eps=0.1190,gamma=0.9905,lam=0.9202_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
55m 31s
-
0.00065
256
10000
0.0007
100
0.18374
0.95
0.95
0.98904
0.94311
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00010_10_buffer_size=10000,eps=0.1837,gamma=0.9890,lam=0.9431_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
57m 9s
-
0.00065
256
20000
0.0007
100
0.17232
0.95
0.95
0.9897
0.90741
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00009_9_buffer_size=20000,eps=0.1723,gamma=0.9897,lam=0.9074_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
55m 42s
-
0.00065
256
10000
0.0007
100
0.11545
0.95
0.95
0.98339
0.9133
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00008_8_buffer_size=10000,eps=0.1155,gamma=0.9834,lam=0.9133_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
59m 14s
-
0.00065
256
20000
0.0007
100
0.15774
0.95
0.95
0.98631
0.9815
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00007_7_buffer_size=20000,eps=0.1577,gamma=0.9863,lam=0.9815_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
56m 2s
-
0.00065
256
10000
0.0007
100
0.15663
0.95
0.95
0.98758
0.96405
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00006_6_buffer_size=10000,eps=0.1566,gamma=0.9876,lam=0.9640_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
57m 59s
-
0.00065
256
20000
0.0007
100
0.16606
0.95
0.95
0.996
0.95694
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00005_5_buffer_size=20000,eps=0.1661,gamma=0.9960,lam=0.9569_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
57m 1s
-
0.00065
256
10000
0.0007
100
0.17471
0.95
0.95
0.98655
0.97575
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00004_4_buffer_size=10000,eps=0.1747,gamma=0.9865,lam=0.9758_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
57m 57s
-
0.00065
256
20000
0.0007
100
0.13997
0.95
0.95
0.98788
0.93752
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00001_1_buffer_size=20000,eps=0.1400,gamma=0.9879,lam=0.9375_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
58m 11s
-
0.00065
256
20000
0.0007
100
0.19528
0.95
0.95
0.98958
0.92172
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00003_3_buffer_size=20000,eps=0.1953,gamma=0.9896,lam=0.9217_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
56m 21s
-
0.00065
256
10000
0.0007
100
0.15079
0.95
0.95
0.99303
0.97414
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00002_2_buffer_size=10000,eps=0.1508,gamma=0.9930,lam=0.9741_2023-07-13_05-28-55
ppo-basic
-
Finished
-
clabornd
56m 25s
-
0.00065
256
10000
0.0007
100
0.18846
0.95
0.95
0.99748
0.97209
0.05
-
10000
/root/ray_results/train_2023-07-13_05-28-51/train_28c8a_00000_0_buffer_size=10000,eps=0.1885,gamma=0.9975,lam=0.9721_2023-07-13_05-28-55
ppo-basic
-
1-32
of 32