Matthewfranglen's workspace
Runs
57
Name
51 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
_n_gpu
_name_or_path
activation_function
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
architectures
attn_pdrop
batch-size
bos_token_id
chunk_size_feed_forward
dataloader_drop_last
dataloader_num_workers
dataloader_pin_memory
ddp_find_unused_parameters
debug
deepspeed
disable_tqdm
diversity_penalty
do_eval
do_predict
do_sample
do_train
early_stopping
embd_pdrop
encoder_no_repeat_ngram_size
eos_token_id
epochs
eval_accumulation_steps
eval_batch_size
eval_steps
evaluation_strategy
fp16
fp16_backend
fp16_full_eval
fp16_opt_level
gradient_accumulation_steps
gradient_checkpointing
greater_is_better
group_by_length
id2label.0
id2label.1
Finished
-
matthewfranglen
5h 23m 41s
1
gpt2-large
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
16
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
16
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
4h 57m 59s
1
gpt2-large
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
16
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
16
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
4h 33m 21s
1
gpt2-large
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
16
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
16
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
4h 8m 32s
1
gpt2-large
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
16
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
16
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
3h 48m 42s
1
gpt2-large
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
16
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
16
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
46m 53s
1
gpt2
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
43m 14s
1
gpt2
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
39m 37s
1
gpt2
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
35m 55s
1
gpt2
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
32m 37s
1
gpt2
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
4h 52m 18s
-
1
gpt2-large
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
16
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
16
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
1h 54m 21s
-
1
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
37m 37s
-
1
gpt2
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
2h 25m 12s
1
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
2h 14m 4s
1
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
2h 2m 18s
1
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
1h 50m 50s
1
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
1h 41m 47s
1
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
40m 31s
1
gpt2
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
Finished
-
matthewfranglen
36m 49s
1
gpt2
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
32
50256
0
false
0
true
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
10
None
32
100
epoch
false
auto
false
O1
1
false
true
false
LABEL_0
LABEL_1
1-20
of 57