D0rj's workspace
Runs
6
Name
6 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
_attn_implementation_autoset
_name_or_path
accelerator_config.even_batches
accelerator_config.non_blocking
accelerator_config.split_batches
accelerator_config.use_seedable_sampler
activation_function
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
allow_embedding_resizing
architectures
attention_bias
attention_dropout
attention_layer
attention_probs_dropout_prob
attn_out_bias
attn_out_dropout_prob
attn_qkv_bias
auto_find_batch_size
average_tokens_across_devices
batch_eval_metrics
bert_layer
bf16
bf16_full_eval
bos_token_id
chunk_size_feed_forward
classifier_activation
classifier_bias
classifier_dropout
classifier_pooling
cls_token_id
compile_model
dataloader_drop_last
dataloader_num_workers
dataloader_persistent_workers
dataloader_pin_memory
ddp_timeout
debug
decoder_bias
deterministic_flash_attn
disable_tqdm
Finished
-
d0rj
4h 51m 58s
-
true
deepvk/RuModernBERT-small
true
false
false
true
gelu
false
0.9
0.999
1.0000e-8
false
true
["ModernBertForMaskedLM"]
false
0
rope
0
false
0.1
false
false
false
false
prenorm
false
false
50281
0
gelu
false
0
cls
50281
true
false
0
false
true
1800
[]
true
false
false
Crashed
-
d0rj
11h 57m
-
true
deepvk/RuModernBERT-small
true
false
false
true
gelu
false
0.9
0.999
1.0000e-8
false
true
["ModernBertForMaskedLM"]
false
0
rope
0
false
0.1
false
false
false
false
prenorm
false
false
50281
0
gelu
false
0
cls
50281
true
false
0
false
true
1800
[]
true
false
false
Crashed
-
d0rj
11h 57m 46s
-
true
deepvk/RuModernBERT-small
true
false
false
true
gelu
false
0.9
0.999
1.0000e-8
false
true
["ModernBertForMaskedLM"]
false
0
rope
0
false
0.1
false
false
false
false
prenorm
false
false
50281
0
gelu
false
0
cls
50281
true
false
0
false
true
1800
[]
true
false
false
Crashed
-
d0rj
11h 57m 31s
-
true
deepvk/RuModernBERT-small
true
false
false
true
gelu
false
0.9
0.999
1.0000e-8
false
true
["ModernBertForMaskedLM"]
false
0
rope
0
false
0.1
false
false
false
false
prenorm
false
false
50281
0
gelu
false
0
cls
50281
true
false
0
false
true
1800
[]
true
false
false
Crashed
-
d0rj
11h 57m 49s
-
true
deepvk/RuModernBERT-small
true
false
false
true
gelu
false
0.9
0.999
1.0000e-8
false
true
["ModernBertForMaskedLM"]
false
0
rope
0
false
0.1
false
false
false
false
prenorm
false
false
50281
0
gelu
false
0
cls
50281
true
false
0
false
true
1800
[]
true
false
false
Crashed
-
d0rj
11h 58m
-
true
deepvk/RuModernBERT-small
true
false
false
true
gelu
false
0.9
0.999
1.0000e-8
false
true
["ModernBertForMaskedLM"]
false
0
rope
0
false
0.1
false
false
false
false
prenorm
false
false
50281
0
gelu
false
0
cls
50281
true
false
0
false
true
1800
[]
true
false
false
1-6
of 6