Cstorm125's workspace
Runs
19
Name
7 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
_n_gpu
_name_or_path
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
architectures
attention_probs_dropout_prob
bos_token_id
chunk_size_feed_forward
dataloader_drop_last
dataloader_num_workers
dataloader_pin_memory
ddp_find_unused_parameters
debug
deepspeed
directionality
disable_tqdm
diversity_penalty
do_eval
do_predict
do_sample
do_train
early_stopping
encoder_no_repeat_ngram_size
eos_token_id
eval_accumulation_steps
eval_batch_size
eval_steps
evaluation_strategy
fp16
fp16_backend
fp16_full_eval
fp16_opt_level
gradient_accumulation_steps
gradient_checkpointing
greater_is_better
group_by_length
hidden_act
hidden_dropout_prob
hidden_size
id2label.0
id2label.1
Finished
-
cstorm125
chimera_qa
13m 57s
-
1
xlm-roberta-base
false
0.9
0.999
1.0000e-8
false
["XLMRobertaForMaskedLM"]
0.1
0
0
false
0
true
None
[]
None
-
false
0
true
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
chimera_qa
25m 56s
-
1
airesearch/wangchan-deberta_v1-base-wiki-20210520-news-spm
false
0.9
0.999
1.0000e-8
false
["DebertaForMaskedLM"]
0.1
-
0
false
0
true
None
[]
None
-
false
0
true
false
false
false
false
0
-
None
16
10
epoch
true
auto
false
O1
1
-
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
chimera_qa
15m 6s
-
1
airesearch/wangchanberta-base-wiki-20210520-news-spm_span-mask
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
0.1
0
0
false
0
true
None
[]
None
-
false
0
true
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
chimera_qa
14m 58s
-
1
airesearchth/wangchanberta-base-wiki-20210520-news-spm
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
0.1
0
0
false
0
true
None
[]
None
-
false
0
true
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
chimera_qa
15m 23s
-
1
airesearchth/wangchanberta-base-wiki-20210520-spm
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
0.1
0
0
false
0
true
None
[]
None
-
false
0
true
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
chimera_qa
11m 24s
-
1
airesearch/wangchanberta-base-att-spm-uncased
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
0.1
0
0
false
0
true
None
[]
None
-
false
0
true
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
chimera_qa
25m 59s
-
1
bert-base-multilingual-cased
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
0.1
-
0
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
false
0
-
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
iapp_thaiqa_xquad
18m 3s
-
1
airesearchth/wangchanberta-base-wiki-20210520-news-spm
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
0.1
0
0
false
0
true
None
[]
None
-
false
0
true
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
iapp_thaiqa_xquad
18m 3s
-
1
airesearchth/wangchanberta-base-wiki-20210520-spm
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
0.1
0
0
false
0
true
None
[]
None
-
false
0
true
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
iapp_thaiqa_xquad
13m 21s
-
1
airesearch/wangchanberta-base-att-spm-uncased
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
0.1
0
0
false
0
true
None
[]
None
-
false
0
true
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
iapp_thaiqa_xquad
30m 47s
-
1
bert-base-multilingual-cased
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
0.1
-
0
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
false
0
-
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
iapp_thaiqa_xquad
16m 16s
-
1
xlm-roberta-base
false
0.9
0.999
1.0000e-8
false
["XLMRobertaForMaskedLM"]
0.1
0
0
false
0
true
None
[]
None
-
false
0
true
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
iapp_thaiqa_v1
14m 40s
-
1
airesearchth/wangchanberta-base-wiki-20210520-spm
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
0.1
0
0
false
0
true
None
false
None
-
false
0
None
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
iapp_thaiqa_v1
23m 58s
-
1
bert-base-multilingual-cased
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
0.1
-
0
false
0
true
None
false
None
bidi
false
0
None
false
false
false
false
0
-
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
iapp_thaiqa_v1
12m 16s
-
1
xlm-roberta-base
false
0.9
0.999
1.0000e-8
false
["XLMRobertaForMaskedLM"]
0.1
0
0
false
0
true
None
false
None
-
false
0
None
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
iapp_thaiqa_v1
10m 2s
-
1
airesearch/wangchanberta-base-att-spm-uncased
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
0.1
0
0
false
0
true
None
false
None
-
false
0
None
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
iapp_thaiq_v2
24m 15s
-
1
bert-base-multilingual-cased
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM"]
0.1
-
0
false
0
true
None
false
None
bidi
false
0
None
false
false
false
false
0
-
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
iapp_thaiq_v2
12m 28s
-
1
xlm-roberta-base
false
0.9
0.999
1.0000e-8
false
["XLMRobertaForMaskedLM"]
0.1
0
0
false
0
true
None
false
None
-
false
0
None
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
Finished
-
cstorm125
iapp_thaiq_v2
10m 10s
-
1
airesearch/wangchanberta-base-att-spm-uncased
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
0.1
0
0
false
0
true
None
false
None
-
false
0
None
false
false
false
false
0
2
None
16
10
epoch
true
auto
false
O1
1
false
false
false
gelu
0.1
768
LABEL_0
LABEL_1
1-19
of 19