Aaatul's workspace
Runs
108
Name
108 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
_n_gpu
_name_or_path
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
architectures
attention_probs_dropout_prob
bos_token_id
chunk_size_feed_forward
classifier_dropout_prob
dataloader_drop_last
dataloader_num_workers
dataloader_pin_memory
ddp_find_unused_parameters
debug
deepspeed
directionality
disable_tqdm
diversity_penalty
do_eval
do_predict
do_sample
do_train
down_scale_factor
early_stopping
embedding_size
encoder_no_repeat_ngram_size
eos_token_id
eval_accumulation_steps
eval_batch_size
eval_steps
evaluation_strategy
fp16
fp16_backend
fp16_full_eval
fp16_opt_level
gap_size
gradient_accumulation_steps
gradient_checkpointing
greater_is_better
group_by_length
hidden_act
Finished
Add notes...
hassi_ahk
42m 19s
-
1
["flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa","neuralspace-reverie/indic-transformers-hi-bert","surajp/RoBERTa-hindi-guj-san"]
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM","RobertaForMaskedLM"]
0.1
0
0
-
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
-
false
-
0
2
None
8
500
epoch
false
auto
false
O1
-
1
false
None
false
gelu
Finished
Add notes...
hassi_ahk
1h 42m 12s
-
1
["ai4bharat/indic-bert","flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa","neuralspace-reverie/indic-transformers-hi-bert","surajp/RoBERTa-hindi-guj-san"]
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM","RobertaForMaskedLM"]
0.08
0.5
0
0.1
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
1
false
128
0
2.25
None
8
500
epoch
false
auto
false
O1
0
1
false
None
false
gelu
Finished
Add notes...
hassi_ahk
35m 2s
-
1
["ai4bharat/indic-bert","flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa","neuralspace-reverie/indic-transformers-hi-bert","surajp/RoBERTa-hindi-guj-san"]
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM","RobertaForMaskedLM"]
0.08
0.5
0
0.1
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
1
false
128
0
2.25
None
8
500
epoch
false
auto
false
O1
0
1
false
None
false
gelu
Finished
Add notes...
hassi_ahk
55m 29s
-
1
["ai4bharat/indic-bert","flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa","neuralspace-reverie/indic-transformers-hi-bert","surajp/RoBERTa-hindi-guj-san"]
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM","RobertaForMaskedLM"]
0.08
0.5
0
0.1
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
1
false
128
0
2.25
None
8
500
epoch
false
auto
false
O1
0
1
false
None
false
gelu
Finished
Add notes...
dk-crazydiv
1h 2m 34s
-
1
["ai4bharat/indic-bert","flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa","neuralspace-reverie/indic-transformers-hi-bert","surajp/RoBERTa-hindi-guj-san"]
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM","RobertaForMaskedLM"]
0.0875
0.28571
0
0.1
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
1
false
128
0
2.14286
None
8
500
epoch
false
auto
false
O1
0
1
false
None
false
gelu
Finished
Add notes...
hassi_ahk
1h 37m 43s
-
1
["ai4bharat/indic-bert","flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa","neuralspace-reverie/indic-transformers-hi-bert","surajp/RoBERTa-hindi-guj-san"]
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM","RobertaForMaskedLM"]
0.0875
0.28571
0
0.1
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
1
false
128
0
2.14286
None
8
500
epoch
false
auto
false
O1
0
1
false
None
false
gelu
Finished
Add notes...
dk-crazydiv
16m 46s
-
1
["ai4bharat/indic-bert","flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa","neuralspace-reverie/indic-transformers-hi-bert","surajp/RoBERTa-hindi-guj-san"]
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM","RobertaForMaskedLM"]
0.0875
0.28571
0
0.1
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
1
false
128
0
2.14286
None
8
500
epoch
false
auto
false
O1
0
1
false
None
false
gelu
Crashed
Add notes...
hassi_ahk
2d 3h 41m 57s
-
1
["flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa"]
false
0.9
0.999
1.0000e-8
false
RobertaForMaskedLM
0.1
0
0
-
false
0
true
None
[]
None
-
false
0
true
false
false
false
-
false
-
0
2
None
8
500
epoch
false
auto
false
O1
-
1
false
None
false
gelu
Finished
Add notes...
hassi_ahk
50m 54s
-
1
flax-community/roberta-pretraining-hindi
false
0.9
0.999
1.0000e-8
false
RobertaForMaskedLM
0.1
0
0
-
false
0
true
None
[]
None
-
false
0
true
false
false
false
-
false
-
0
2
None
8
500
epoch
false
auto
false
O1
-
1
false
None
false
gelu
Finished
Add notes...
hassi_ahk
1h 10m 19s
-
1
["ai4bharat/indic-bert","flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa","neuralspace-reverie/indic-transformers-hi-bert","surajp/RoBERTa-hindi-guj-san"]
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM","RobertaForMaskedLM"]
0.0875
0.28571
0
0.1
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
1
false
128
0
2.14286
None
8
500
epoch
false
auto
false
O1
0
1
false
None
false
gelu
Finished
Add notes...
hassi_ahk
22m 49s
-
1
["ai4bharat/indic-bert","flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa","neuralspace-reverie/indic-transformers-hi-bert","surajp/RoBERTa-hindi-guj-san"]
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM","RobertaForMaskedLM"]
0.0875
0.28571
0
0.1
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
1
false
128
0
2.14286
None
8
500
epoch
false
auto
false
O1
0
1
false
None
false
gelu
Crashed
Add notes...
hassi_ahk
2d 55m 45s
-
1
flax-community/roberta-pretraining-hindi
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM","RobertaForSequenceClassification"]
0.1
0
0
-
false
0
true
None
[]
None
-
false
0
true
false
false
false
-
false
-
0
2
None
8
500
epoch
false
auto
false
O1
-
1
false
None
false
gelu
Crashed
Add notes...
hassi_ahk
1d 5h 38m 19s
-
1
["ai4bharat/indic-bert","flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa","neuralspace-reverie/indic-transformers-hi-bert","surajp/RoBERTa-hindi-guj-san"]
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM","RobertaForMaskedLM"]
0.0875
0.28571
0
0.1
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
1
false
128
0
2.14286
None
8
500
epoch
false
auto
false
O1
0
1
false
None
false
gelu
Crashed
Add notes...
dk-crazydiv
6d 10h 6m 42s
-
1
["ai4bharat/indic-bert","flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa","neuralspace-reverie/indic-transformers-hi-bert","surajp/RoBERTa-hindi-guj-san"]
false
0.9
0.999
1.0000e-8
false
["BertForMaskedLM","RobertaForMaskedLM"]
0.09
0.22222
0
0.1
false
0
true
None
[]
None
bidi
false
0
true
false
false
false
1
false
128
0
2.11111
None
8
500
epoch
false
auto
false
O1
0
1
false
None
false
gelu
Crashed
Add notes...
hassi_ahk
5d 9h 17m 31s
-
1
["ai4bharat/indic-bert","export_torch_model","flax-community/roberta-pretraining-hindi","mrm8488/HindiBERTa","surajp/RoBERTa-hindi-guj-san"]
false
0.9
0.999
1.0000e-8
false
RobertaForMaskedLM
0.09
0.2
0
0.1
false
0
true
None
[]
None
-
false
0
true
false
false
false
1
false
128
0
2.1
None
8
500
epoch
false
auto
false
O1
0
1
false
None
false
gelu
1-15
of 15