Mustafakeser's workspace
Runs
85
Name
85 visualized
eval/loss
-
1.92055
1.44684
-
-
-
-
1.63485
-
-
-
-
2.19679
-
1.58716
1.64362
1.71288
1.72865
1.94728
1.7184
1.94696
1.70608
1.71282
1.68664
1.71118
1.80458
1.7249
1.94656
1.70328
1.69063
1.94773
1.70514
1.7219
1.69853
1.71242
1.79021
1.36161
1.4083
1.42866
1.50151
1.31984
1.3729
1.50856
1.36515
1.50227
1.44622
1.35681
1.50151
1.31984
1.3729
1.62797
1.52678
1.75715
-
-
-
-
1.94367
-
1.3425
-
1.94623
1.59951
1.94591
1.94663
1.81356
1.63914
1.94604
1.94655
1.9462
1.94777
1.85492
1.93713
1.94615
1.94719
1.94681
1.94618
1.94604
1.82766
1.94794
1.94656
1.96609
1.96712
1.96712
-
State
Notes
User
Tags
Created
Runtime
Sweep
_name_or_path
activation
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
architectures
attention_dropout
attention_probs_dropout_prob
auto_find_batch_size
batch_size
bf16
bf16_full_eval
bos_token_id
chunk_size_feed_forward
dataloader_drop_last
dataloader_num_workers
dataloader_pin_memory
ddp_timeout
debug
dim
disable_tqdm
diversity_penalty
do_eval
do_predict
do_sample
do_train
dropout
early_stopping
encoder_no_repeat_ngram_size
eos_token_id
epochs
eval_delay
eval_steps
evaluation_strategy
fp16
fp16_backend
fp16_full_eval
fp16_opt_level
fsdp
Finished
-
mustafakeser
OTHER-RUNS
55m 18s
-
bert-base-uncased
-
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
-
0.1
false
-
false
false
-
0
false
0
true
1800
[]
-
false
0
false
false
false
false
-
false
0
-
-
0
-
no
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
26m 28s
-
bert-base-cased
gelu
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
0.1
0.1
false
-
false
false
-
0
false
0
true
1800
[]
768
false
0
true
false
false
false
0.1
false
0
-
-
0
500
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
32m 25s
-
bert-base-cased
-
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
-
0.1
false
-
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
-
0
500
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
6m 35s
-
distilbert-base-uncased
gelu
false
0.9
0.999
1.0000e-8
false
["DistilBertForMaskedLM"]
0.1
-
false
-
false
false
-
0
false
0
true
1800
[]
768
false
0
true
false
false
false
0.1
false
0
-
-
0
500
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
12m 31s
-
gpt2
-
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
-
-
false
-
false
false
50256
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
50256
-
0
500
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
1m 29s
-
gpt2
-
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
-
-
false
-
false
false
50256
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
50256
-
0
500
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
14m 13s
-
gpt2
-
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
-
-
false
-
false
false
50256
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
50256
-
0
500
steps
true
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
26m 20s
-
gpt2
-
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
-
-
false
-
false
false
50256
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
50256
-
0
500
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
EDA
STEPS
1h 1m 26s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
-
mustafakeser
EDA
STEPS
9m 55s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
-
mustafakeser
SPLIT
STEPS
22m 4s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
-
mustafakeser
SPLIT
1m 24s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
This baseline achieved 1.368 lb public score.
mustafakeser
STEPS
TRAIN
14m 3s
-
distilbert-base-uncased
gelu
false
0.9
0.999
1.0000e-8
false
["DistilBertForMaskedLM"]
0.1
-
false
-
false
false
-
0
false
0
true
1800
[]
768
false
0
true
false
false
false
0.1
false
0
-
-
0
500
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
2m 5s
-
roberta-large
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
500
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
2h 6m 14s
-
t5-base
gelu
false
0.9
0.999
1.0000e-8
false
["T5ForConditionalGeneration"]
0.1
0.1
false
-
false
false
-
0
false
0
true
1800
[]
768
false
0
true
false
false
false
0.1
false
0
1
-
0
500
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
1h 36m 43s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
100
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 21s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
32
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 24s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
8
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 10s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
32
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 10s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
32
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 19s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
16
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 9s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
32
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 23s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
8
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 23s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
8
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 19s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
16
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 9s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
32
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 18s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
16
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 23s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
8
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 29s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
8
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 25s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
8
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 9s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
32
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 10s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
32
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 23s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
8
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 11s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
32
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 18s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
16
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS
4m 18s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
16
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
21m 39s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
9m 35s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
9m 35s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
12m 44s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
RETRAIN
TRAIN
9m 32s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
9m 33s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
10m 13s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
10m 15s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
8m 48s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
11m 10s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
9m 35s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
12m 49s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
RETRAIN
STEPS
TRAIN
9m 36s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
CV
9m 36s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
13m 15s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
100
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
11m 27s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
100
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
6m 21s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForSequenceClassification"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
1m 6s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
50
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
PREPROCESS
6m 53s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
-
mustafakeser
PREPROCESS
1m 14s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
-
mustafakeser
OTHER-RUNS
1m 4s
-
bert-base-cased
-
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
-
0.1
false
-
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
-
0
100
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
26m 25s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
100
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
2m 29s
-
microsoft/deberta-v3-large
-
false
0.9
0.999
1.0000e-8
false
-
-
0.1
false
-
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
-
0
100
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
OTHER-RUNS
45m 46s
-
/kaggle/input/huggingfacedebertav3variants/deberta-v3-large
-
false
0.9
0.999
1.0000e-8
false
-
-
0.1
false
-
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
-
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
EDA
4m 28s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
-
mustafakeser
SWEEPS2
8m 27s
bert-base-uncased
-
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
-
0.1
false
4
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
7m 28s
bert-base-uncased
-
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
-
0.1
false
16
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
4m 17s
distilbert-base-uncased
gelu
false
0.9
0.999
1.0000e-8
false
["DistilBertForMaskedLM"]
0.1
-
false
16
false
false
-
0
false
0
true
1800
[]
768
false
0
true
false
false
false
0.1
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
4m 54s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
4
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
4m 46s
distilbert-base-uncased
gelu
false
0.9
0.999
1.0000e-8
false
["DistilBertForMaskedLM"]
0.1
-
false
4
false
false
-
0
false
0
true
1800
[]
768
false
0
true
false
false
false
0.1
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
4m 27s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
8
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
4m 45s
distilbert-base-uncased
gelu
false
0.9
0.999
1.0000e-8
false
["DistilBertForMaskedLM"]
0.1
-
false
4
false
false
-
0
false
0
true
1800
[]
768
false
0
true
false
false
false
0.1
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
4m 52s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
4
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
4m 52s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
4
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
7m 31s
bert-base-uncased
-
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
-
0.1
false
16
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
4m 22s
distilbert-base-uncased
gelu
false
0.9
0.999
1.0000e-8
false
["DistilBertForMaskedLM"]
0.1
-
false
8
false
false
-
0
false
0
true
1800
[]
768
false
0
true
false
false
false
0.1
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
7m 35s
bert-base-uncased
-
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
-
0.1
false
16
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
4m 22s
distilbert-base-uncased
gelu
false
0.9
0.999
1.0000e-8
false
["DistilBertForMaskedLM"]
0.1
-
false
16
false
false
-
0
false
0
true
1800
[]
768
false
0
true
false
false
false
0.1
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
8m 21s
bert-base-uncased
-
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
-
0.1
false
4
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
8m 18s
bert-base-uncased
-
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
-
0.1
false
4
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
7m 47s
bert-base-uncased
-
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
-
0.1
false
8
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
4m 28s
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
8
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
4m 16s
distilbert-base-uncased
gelu
false
0.9
0.999
1.0000e-8
false
["DistilBertForMaskedLM"]
0.1
-
false
16
false
false
-
0
false
0
true
1800
[]
768
false
0
true
false
false
false
0.1
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
7m 34s
bert-base-uncased
-
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
-
0.1
false
16
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
-
mustafakeser
SWEEPS2
7m 47s
bert-base-uncased
-
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
-
0.1
false
8
false
false
-
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
-
2
0
-
epoch
false
auto
false
O1
[]
Finished
smoke test
mustafakeser
GITHUB-ACTIONS
RETRAIN
STEPS
16m 54s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
10
steps
false
auto
false
O1
[]
Finished
smoke test
mustafakeser
GITHUB-ACTIONS
RETRAIN
STEPS
9m 57s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
10
steps
false
auto
false
O1
[]
Finished
smoke test
mustafakeser
GITHUB-ACTIONS
RETRAIN
STEPS
5m 58s
-
distilroberta-base
-
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
-
0.1
false
-
false
false
0
0
false
0
true
1800
[]
-
false
0
true
false
false
false
-
false
0
2
-
0
10
steps
false
auto
false
O1
[]
Finished
-
mustafakeser
RETRAIN
38s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
1-85
of 85