Angus27's workspace
Runs
2
State
Notes
User
Tags
Created
Runtime
Sweep
_attn_implementation_autoset
_name_or_path
accelerator_config.even_batches
accelerator_config.non_blocking
accelerator_config.split_batches
accelerator_config.use_seedable_sampler
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
architectures
attention_probs_dropout_prob
auto_find_batch_size
average_tokens_across_devices
batch_eval_metrics
batch_size
bf16
bf16_full_eval
bos_token_id
chunk_size_feed_forward
dataloader_drop_last
dataloader_num_workers
dataloader_persistent_workers
dataloader_pin_memory
ddp_timeout
debug
disable_tqdm
diversity_penalty
do_eval
do_predict
do_sample
do_train
early_stopping
encoder_no_repeat_ngram_size
eos_token_id
epochs
eval_delay
eval_do_concat_batches
eval_on_start
eval_strategy
eval_use_gather_object
fp16
fp16_backend
Finished
angus27
8m 24s
-
true
distilroberta-base
true
false
false
true
false
0.9
0.999
1.0000e-8
false
["RobertaForMaskedLM"]
0.1
false
false
false
16
false
false
0
0
false
0
false
true
1800
[]
false
0
false
false
false
false
false
0
2
3
0
true
false
no
false
false
auto
Finished
angus27
1h 8m 3s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
1-2
of 2