Mwritescode's workspace
Runs
141
Name
141 visualized
eval_episode_return.mean
802.88095
860.80174
671.11342
494.5735
765.87074
833.05785
797.60492
248.15504
Created
Runtime
Group
End Time
Hostname
ID
Notes
State
Updated
Tags
AGENT.AUGMENT
AGENT.BATCH_SIZE
AGENT.BETA
AGENT.BUFFER_SIZE
AGENT.CLIP_REWARDS
AGENT.DISCOUNT_FACTOR
AGENT.DOUBLE
AGENT.DUELING
AGENT.EPS_ANNEALING_STEPS
AGENT.EPS_END
AGENT.EPS_EVAL
AGENT.EPS_START
AGENT.EVALUATE_AFTER
AGENT.EVALUATION_EPISODES
AGENT.LOG_TABLE
AGENT.LOG_TABLE_PERIOD
AGENT.MAX_EPISODE_FRAMES
AGENT.MAX_TRAIN_FRAMES
AGENT.NOISY_NETS
AGENT.NUM_UPDATES_PER_STEP
AGENT.PLAY_RANDOMLY
AGENT.PRIORITIZED_REPLAY
AGENT.RECORD_VIDEO
AGENT.TAU
AGENT.UPDATE_TAGRET_AFTER
AGENT.USE_TARGET
AGENT.WARMUP_FRAMES
EVALUATION.CHECKPOINT_PATH
EVALUATION.MAX_FRAMES
EVALUATION.SEED
EVALUATION.SEEDS
EVALUATION.WANDB.GROUP
EVALUATION.WANDB.NAME
EVALUATION.WANDB.PROJECT
TRAINING.CHECKPOINT_PATH
TRAINING.CLIPNORM
TRAINING.LEARNING_RATE
TRAINING.LOSS
TRAINING.SEED
TRAINING.SEEDS
AGENT.VGG
1d 12h 33m 56s
multi-update
Aug 20 '22 20:16
-
multi-update
-
Finished
Jan 01 '70 00:00
true
32
0.4
100000
true
0.99
true
true
50000
0.01
0.001
1
5000
5
true
100
108000
73888.88889
true
5.11111
false
true
true
0.99
1
true
9000
["checkpoints/multi_update-1/multi_update-1.ckpt","checkpoints/multi_update-2/multi_update-2.ckpt","checkpoints/multi_update-3/multi_update-3.ckpt"]
125000
204.4
204.4
multi-update
["eval-1","eval-2","eval-3"]
data-efficient-rl
["checkpoints/multi_update-1/multi_update-1.ckpt","checkpoints/multi_update-2/multi_update-2.ckpt","checkpoints/multi_update-3/multi_update-3.ckpt"]
10
0.0000625
huber
2
2
false
2d 5h 51m 23s
augmented-dr.q
Aug 19 '22 18:18
-
augmented-dr.q
-
Finished
Jan 01 '70 00:00
true
32
0.4
100000
true
0.99
true
true
50000
0.01
0.001
1
5000
5
true
100
108000
100000
true
1
false
true
true
0.99
1
true
20000
["checkpoints/augment-1/augment-1.ckpt","checkpoints/augment-2/augment-2.ckpt","checkpoints/augment-3/augment-3.ckpt"]
125000
204.4
204.4
augmented-dr.q
["eval-1","eval-2","eval-3"]
data-efficient-rl
["checkpoints/augment-1/augment-1.ckpt","checkpoints/augment-2/augment-2.ckpt","checkpoints/augment-3/augment-3.ckpt"]
10
0.0000625
huber
2
2
-
3d 4h 17m 51s
default-dqn
Aug 19 '22 15:40
-
default-dqn
-
Finished
Jan 01 '70 00:00
false
32
0.4
100000
true
0.99
false
false
50000
0.01
0.001
1
5000
5
true
100
108000
100000
false
1
false
false
true
0.99
1
true
20000
["checkpoints/default_dqn-1/default_dqn-1.ckpt","checkpoints/default_dqn-2/default_dqn-2.ckpt","checkpoints/default_dqn-3/default_dqn-3.ckpt"]
125000
204.4
204.4
default-dqn
["eval-1","eval-2","eval-3"]
data-efficient-rl
["checkpoints/default_dqn-1/default_dqn-1.ckpt","checkpoints/default_dqn-2/default_dqn-2.ckpt","checkpoints/default_dqn-3/default_dqn-3.ckpt"]
10
0.0000625
huber
2
2
-
2d 9h 32m 15s
dueling-dqn
Aug 19 '22 09:45
-
dueling-dqn
-
Finished
Jan 01 '70 00:00
false
32
0.4
100000
true
0.99
true
true
50000
0.01
0.001
1
5000
5
true
100
108000
100000
false
1
false
true
true
0.99
1
true
20000
["checkpoints/dueling-1/dueling-1.ckpt","checkpoints/dueling-2/dueling-2.ckpt","checkpoints/dueling-3/dueling-3.ckpt"]
125000
204.4
204.4
dueling-dqn
["eval-1","eval-2","eval-3"]
data-efficient-rl
["checkpoints/dueling-1/dueling-1.ckpt","checkpoints/dueling-2/dueling-2.ckpt","checkpoints/dueling-3/dueling-3.ckpt"]
10
0.0000625
huber
2
2
-
2d 15h 56m 2s
prioritized-replay
Aug 19 '22 13:38
-
prioritized-replay
-
Finished
Jan 01 '70 00:00
false
32
0.4
100000
true
0.99
true
false
50000
0.01
0.001
1
5000
5
true
100
108000
100000
false
1
false
true
true
0.99
1
true
20000
["checkpoints/prioritized_replay-1/prioritized_replay-1.ckpt","checkpoints/prioritized_replay-2/prioritized_replay-2.ckpt","checkpoints/prioritized_replay-3/prioritized_replay-3.ckpt"]
125000
204.4
204.4
prioritized-replay
["eval-1","eval-2","eval-3"]
data-efficient-rl
["checkpoints/prioritized_replay-1/prioritized_replay-1.ckpt","checkpoints/prioritized_replay-2/prioritized_replay-2.ckpt","checkpoints/prioritized_replay-3/prioritized_replay-3.ckpt"]
10
0.0000625
huber
2
2
-
2d 2h 45m 31s
noisy-nets
Aug 19 '22 12:00
-
noisy-nets
-
Finished
Jan 01 '70 00:00
false
32
0.4
100000
true
0.99
true
true
50000
0.01
0.001
1
5000
5
true
100
108000
100000
true
1
false
true
true
0.99
1
true
20000
["checkpoints/noisy_nets-1/noisy_nets-1.ckpt","checkpoints/noisy_nets-2/noisy_nets-2.ckpt","checkpoints/noisy_nets-3/noisy_nets-3.ckpt"]
125000
204.4
204.4
noisy-nets
["eval-1","eval-2","eval-3"]
data-efficient-rl
["checkpoints/noisy_nets-1/noisy_nets-1.ckpt","checkpoints/noisy_nets-2/noisy_nets-2.ckpt","checkpoints/noisy_nets-3/noisy_nets-3.ckpt"]
10
0.0000625
huber
2
2
-
2d 20h 44m 26s
double-dqn
Aug 19 '22 10:18
-
double-dqn
-
Finished
Jan 01 '70 00:00
false
32
0.4
100000
true
0.99
true
false
50000
0.01
0.001
1
5000
5
true
100
108000
100000
false
1
false
false
true
0.99
1
true
20000
["checkpoints/double-1/double-1.ckpt","checkpoints/double-2/double-2.ckpt","checkpoints/double-3/double-3.ckpt"]
125000
204.4
219.30435
double-dqn
["eval-1","eval-2","eval-3"]
data-efficient-rl
["checkpoints/double-1/double-1.ckpt","checkpoints/double-2/double-2.ckpt","checkpoints/double-3/double-3.ckpt"]
10
0.0000625
huber
2
2
-
46m 25s
random
Aug 18 '22 10:41
-
random
-
Finished
Jan 01 '70 00:00
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
checkpoints/run-name
125000
194.53333
194.53333
random
eval-
data-efficient-rl
-
-
-
-
-
-
-
1-8
of 8