Pszemraj's workspace
Runs
620
Name
480 visualized
eval/accuracy
eval/combined_score
eval/matthews_correlation
train/epoch
0.52708
-
-
2.93
0.46479
-
-
2.72
0.68137
0.74593
-
2.98
-
0.056742
-
2.97
-
-
0
2.99
0.54513
-
-
2.92
0.40845
-
-
3
0.68382
0.74803
-
2.93
-
0.020967
-
2.94
-
-
0
2.96
-
-
-0.011355
3
0.54
-
-
3
0.598
-
-
3
0.762
0.70124
-
3
0.732
-
-
3
0.51264
-
-
2.92
0.57746
-
-
3
0.68382
0.74803
-
2.92
-
-0.086519
-
3
-
-
0
3
State
Notes
User
Tags
Created
Runtime
Sweep
_name_or_path
accelerator_config.even_batches
accelerator_config.split_batches
accelerator_config.use_seedable_sampler
activation
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
add_lm_hidden_dense_layer
add_token_type_embeddings
architectures
attention_activation
attention_dropout
attention_mode
attention_probs_dropout_prob
attention_type
attention_window
auto_find_batch_size
bf16
bf16_full_eval
bidirectional
block_size
bos_token_id
chunk_size
chunk_size_feed_forward
classifier_dropout
cls_token_id
conv_kernel_size
dataloader_drop_last
dataloader_num_workers
dataloader_persistent_workers
dataloader_pin_memory
ddp_timeout
debug
dim
disable_tqdm
diversity_penalty
do_eval
do_predict
do_sample
do_train
dropout
Finished
-
pszemraj
7m 54s
-
pszemraj/pile-t5-large-fixed
true
false
true
-
false
0.9
0.999
1.0000e-8
false
-
-
["T5ForConditionalGeneration"]
-
-
-
-
-
-
false
false
false
-
-
-
-
0
0
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
1m 57s
-
pszemraj/pile-t5-large-fixed
true
false
true
-
false
0.9
0.999
1.0000e-8
false
-
-
["T5ForConditionalGeneration"]
-
-
-
-
-
-
false
false
false
-
-
-
-
0
0
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
11m 46s
-
pszemraj/pile-t5-large-fixed
true
false
true
-
false
0.9
0.999
1.0000e-8
false
-
-
["T5ForConditionalGeneration"]
-
-
-
-
-
-
false
false
false
-
-
-
-
0
0
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
18m 1s
-
pszemraj/pile-t5-large-fixed
true
false
true
-
false
0.9
0.999
1.0000e-8
false
-
-
["T5ForConditionalGeneration"]
-
-
-
-
-
-
false
false
false
-
-
-
-
0
0
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
26m 31s
-
pszemraj/pile-t5-large-fixed
true
false
true
-
false
0.9
0.999
1.0000e-8
false
-
-
["T5ForConditionalGeneration"]
-
-
-
-
-
-
false
false
false
-
-
-
-
0
0
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
2m 56s
-
pszemraj/pile-t5-base-fixed
true
false
true
-
false
0.9
0.999
1.0000e-8
false
-
-
["T5ForConditionalGeneration"]
-
-
-
-
-
-
false
false
false
-
-
-
-
0
0
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
51s
-
pszemraj/pile-t5-base-fixed
true
false
true
-
false
0.9
0.999
1.0000e-8
false
-
-
["T5ForConditionalGeneration"]
-
-
-
-
-
-
false
false
false
-
-
-
-
0
0
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
4m 14s
-
pszemraj/pile-t5-base-fixed
true
false
true
-
false
0.9
0.999
1.0000e-8
false
-
-
["T5ForConditionalGeneration"]
-
-
-
-
-
-
false
false
false
-
-
-
-
0
0
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
6m 32s
-
pszemraj/pile-t5-base-fixed
true
false
true
-
false
0.9
0.999
1.0000e-8
false
-
-
["T5ForConditionalGeneration"]
-
-
-
-
-
-
false
false
false
-
-
-
-
0
0
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
9m 36s
-
pszemraj/pile-t5-base-fixed
true
false
true
-
false
0.9
0.999
1.0000e-8
false
-
-
["T5ForConditionalGeneration"]
-
-
-
-
-
-
false
false
false
-
-
-
-
0
0
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
6m 50s
-
EleutherAI/pile-t5-base
true
false
true
-
false
0.9
0.999
1.0000e-8
false
-
-
["UMT5ForConditionalGeneration"]
-
-
-
-
-
-
false
false
false
-
-
-
-
0
0
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
24m 18s
-
mnaylor/mega-base-wikitext
true
false
true
silu
false
0.9
0.999
1.0000e-8
false
false
false
["MegaForMaskedLM"]
softmax
-
-
0.1
-
-
false
false
false
true
-
0
-1
0
-
-
-
false
0
false
false
1800
[]
-
false
0
true
true
false
true
-
Finished
-
pszemraj
7m 27s
-
mnaylor/mega-base-wikitext
true
false
true
silu
false
0.9
0.999
1.0000e-8
false
false
false
["MegaForMaskedLM"]
softmax
-
-
0.1
-
-
false
false
false
true
-
0
-1
0
-
-
-
false
0
false
false
1800
[]
-
false
0
true
true
false
true
-
Finished
-
pszemraj
26m 2s
-
mnaylor/mega-base-wikitext
true
false
true
silu
false
0.9
0.999
1.0000e-8
false
false
false
["MegaForMaskedLM"]
softmax
-
-
0.1
-
-
false
false
false
true
-
0
-1
0
-
-
-
false
0
false
false
1800
[]
-
false
0
true
true
false
true
-
Finished
-
pszemraj
6m 10s
-
mnaylor/mega-base-wikitext
true
false
true
silu
false
0.9
0.999
1.0000e-8
false
false
false
["MegaForMaskedLM"]
softmax
-
-
0.1
-
-
false
false
false
true
-
0
-1
0
-
-
-
false
0
false
false
1800
[]
-
false
0
true
true
false
true
-
Finished
-
pszemraj
15s
-
mnaylor/mega-base-wikitext
true
false
true
silu
false
0.9
0.999
1.0000e-8
false
false
false
["MegaForMaskedLM"]
softmax
-
-
0.1
-
-
false
false
false
true
-
0
-1
0
-
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
7s
-
mnaylor/mega-base-wikitext
true
false
true
silu
false
0.9
0.999
1.0000e-8
false
false
false
["MegaForMaskedLM"]
softmax
-
-
0.1
-
-
false
false
false
true
-
0
-1
0
-
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
22s
-
mnaylor/mega-base-wikitext
true
false
true
silu
false
0.9
0.999
1.0000e-8
false
false
false
["MegaForMaskedLM"]
softmax
-
-
0.1
-
-
false
false
false
true
-
0
-1
0
-
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
30s
-
mnaylor/mega-base-wikitext
true
false
true
silu
false
0.9
0.999
1.0000e-8
false
false
false
["MegaForMaskedLM"]
softmax
-
-
0.1
-
-
false
false
false
true
-
0
-1
0
-
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
Finished
-
pszemraj
40s
-
mnaylor/mega-base-wikitext
true
false
true
silu
false
0.9
0.999
1.0000e-8
false
false
false
["MegaForMaskedLM"]
softmax
-
-
0.1
-
-
false
false
false
true
-
0
-1
0
-
-
-
false
0
false
true
1800
[]
-
false
0
true
false
false
true
-
1-20
of 480