Brianferrell78's workspace
Runs
45
Name
45 visualized
State
Notes
Runtime
Tags
Created
mcc
Training loss
eval_loss
adafactor_clip_threshold
adafactor_decay_rate
adafactor_eps
adam_epsilon
custom_layer_parameters
eval_batch_size
labels_list
max_seq_length
model_class
model_name
model_type
num_train_epochs
optimizer
scheduler
sliding_window
stride
train_batch_size
wandb_project
warmup_ratio
warmup_steps
weight_decay
train_loss
Finished
32m 58s
0.97942
0.000044204
0.31559
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.000044204
Finished
32m 49s
0.96422
0.00025744
0.34466
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.00025744
Finished
32m 54s
0.98978
0.000054919
0.23374
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.000054919
Finished
32m 54s
0.98976
0.00014153
0.23719
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.00014153
Finished
33m 5s
0.9647
0.0000495
0.46406
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.0000495
Finished
32m 53s
0.98459
0.000059496
0.24835
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.000059496
Finished
32m 59s
0.97459
0.000043178
0.36664
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.000043178
Finished
35m 20s
0.97961
0.000059628
0.33015
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.000059628
Finished
33m 28s
0.98972
0.00016534
0.25167
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.00016534
Finished
33m 15s
0.98467
0.00019344
0.30127
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.00019344
Finished
33m 9s
0.97447
0.00023943
0.33042
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.00023943
Finished
33m 34s
0.9796
0.000089248
0.2902
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.000089248
Finished
33m 16s
0.97951
0.00012973
0.28585
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.00012973
Finished
34m 11s
0.98972
0.00011443
0.22856
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.00011443
Finished
34m 40s
0.94356
0.017932
0.31612
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
5
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
323
0
0.017932
Finished
26m 45s
0.97952
0.000086248
0.24799
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.00011159
Finished
26m 51s
0.97953
0.000088653
0.29815
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.00011482
Finished
26m 55s
0.98462
0.00010411
0.29025
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.00013678
Finished
27m 1s
0.97433
0.00011687
0.23812
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.0013871
Finished
26m 54s
0.97962
0.000082944
0.26363
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.000094583
Finished
26m 55s
0.97948
0.00011182
0.3853
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.00018765
Finished
26m 42s
0.99487
0.000091834
0.24677
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.00011636
Finished
27m
0.98462
0.00011108
0.2237
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.0002935
Finished
27m 7s
0.97942
0.00010054
0.19839
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.00051066
Finished
27m 2s
0.97433
0.00013022
0.23699
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.0081902
Finished
27m 24s
0.97433
0.00014355
0.25768
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.00015723
Finished
27m 1s
0.97447
0.00012127
0.27358
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.00062607
Finished
27m 59s
0.98459
0.00045824
0.24154
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.035652
Finished
28m 14s
0.97947
0.00043054
0.23547
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.087427
Finished
28m 25s
0.90781
0.072666
0.38045
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
4
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
259
0
0.22694
Finished
21m 37s
0.97945
0.00019547
0.25062
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00015832
Finished
20m 33s
0.97438
0.0012192
0.25537
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00016266
Finished
20m 41s
0.98456
0.00022529
0.19963
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00014471
Finished
20m 52s
0.98456
0.00022463
0.20323
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00014916
Finished
20m 42s
0.97952
0.00019903
0.33695
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00013118
Finished
20m 44s
0.97428
0.00026176
0.24614
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00019392
Finished
21m 14s
0.98459
0.00023145
0.20765
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00017417
Finished
21m 16s
0.98456
0.00031787
0.20141
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00014025
Finished
20m 47s
0.96915
0.00052258
0.19648
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00017465
Finished
20m 57s
0.97427
0.00058135
0.20974
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00001},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00019237
Finished
20m 47s
0.98456
0.00050785
0.21
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00022824
Finished
21m 16s
0.97947
0.00045277
0.19658
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00002},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00017307
Finished
21m 54s
0.97947
0.0011196
0.21317
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004},{"lr":0.00004}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.00018935
Finished
25m 12s
0.97947
0.0014066
0.22727
1
-0.8
[9.999999999999999e-31,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003},{"lr":0.00003}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.0002399
Finished
25m 18s
0.82321
0.1261
0.49162
1
-0.8
[1e-30,0.001]
1.0000e-8
[{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0},{"lr":0}]
8
[0,1,2]
128
ClassificationModel
bert-base-uncased
bert
3
AdamW
linear_schedule_with_warmup
true
0.8
32
Fine-Tuning_BERT
0.06
194
0
0.15095
1-45
of 45