Randomfoo's workspace
Runs
6
State
Notes
User
Tags
Created
Runtime
Sweep
_name_or_path
accelerator_config.even_batches
accelerator_config.non_blocking
accelerator_config.split_batches
accelerator_config.use_seedable_sampler
accumulate_allreduce_grads_in_fp32
adafactor
adam_beta1
adam_beta2
adam_betas
adam_eps
adam_epsilon
adam_offload
add_bias_linear
add_cross_attention
add_position_embedding
add_qkv_bias
adlr_autoresume
adlr_autoresume_interval
align_grad_reduce
align_param_gather
app_tag_run_version
apply_chat_template
apply_layernorm_1p
apply_query_key_layer_scaling
apply_residual_connection_post_layernorm
apply_rope_fusion
architectures
async_tensor_model_parallel_allreduce
attention_backend
attention_bias
attention_dropout
attention_sink_k
attention_softmax_in_fp32
attn_implementation
auto_detect_ckpt_format
auto_find_batch_size
aux_loss_coef
average_tokens_across_devices
barrier_with_L1_time
batch_eval_metrics
bench_dataset
bench_source_max_len
bench_split
Finished
-
randomfoo
1h 24m 29s
-
meta-llama/Llama-3.2-1B-Instruct
true
false
false
true
-
false
0.9
0.999
-
-
1.0000e-8
-
-
false
-
-
-
-
-
-
-
-
-
-
-
-
["LlamaForCausalLM"]
-
-
false
0
-
-
-
-
false
-
false
-
false
pharaouk/dharma-1/dharma_1_mini.json
2048
eval
Finished
-
randomfoo
27m 33s
-
-
-
-
-
-
-
-
-
-
[0.9,0.95]
-
-
false
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
-
-
-
-
-
flash_attention_2
-
-
0
-
-
-
-
-
-
Finished
-
randomfoo
2h 14m 17s
-
-
-
-
-
-
-
-
-
-
[0.9,0.95]
-
-
false
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
-
-
-
-
-
flash_attention_2
-
-
0
-
-
-
-
-
-
Finished
-
randomfoo
2h 1m
-
-
-
-
-
-
-
-
-
-
[0.9,0.95]
-
-
false
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
-
-
-
-
-
flash_attention_2
-
-
0
-
-
-
-
-
-
Finished
-
randomfoo
9h 50m 10s
-
-
-
-
-
-
true
-
0.9
0.999
-
1.0000e-8
-
-
false
-
true
false
false
1000
true
false
0.0.0
-
false
false
false
true
-
false
auto
-
0.1
0
false
-
false
-
-
-
true
-
-
-
-
Finished
-
randomfoo
8h 34m 31s
-
-
-
-
-
-
-
-
-
-
[0.9,0.95]
-
-
false
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
-
-
-
-
-
flash_attention_2
-
-
0
-
-
-
-
-
-
1-6
of 6