Randomfoo's workspace
Runs
23
Name
4 visualized
State
Finished
Killed
Killed
Killed
Finished
Crashed
Crashed
Crashed
Finished
Finished
Finished
Finished
Failed
Finished
Finished
Finished
Finished
Finished
Finished
Finished
_name_or_path
accelerator_config.even_batches
accelerator_config.split_batches
accelerator_config.use_seedable_sampler
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
architectures
attention_bias
attention_dropout
auto_find_batch_size
batch_size
bf16
bf16_full_eval
bos_token_id
checkpointer._component_
checkpointer.checkpoint_dir
checkpointer.checkpoint_files
checkpointer.model_type
checkpointer.output_dir
chunk_size_feed_forward
compile
dataloader_drop_last
dataloader_num_workers
dataloader_persistent_workers
dataloader_pin_memory
dataset._component_
dataset.max_seq_len
dataset.packed
ddp_timeout
debug
device
disable_tqdm
diversity_penalty
do_eval
do_predict
do_sample
do_train
dtype
early_stopping
enable_activation_checkpointing
encoder_no_repeat_ngram_size
eos_token_id
epochs
eval_delay
evaluation_strategy
fp16
fp16_backend
fp16_full_eval
-
-
-
-
-
-
-
-
-
-
-
-
-
16
-
-
-
torchtune.training.FullModelHFCheckpointer
/tune/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tune/Meta-Llama-3-8B-Instruct/
-
true
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
-
true
-
-
cuda
-
-
-
-
-
-
bf16
-
false
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
32
-
-
-
torchtune.training.FullModelHFCheckpointer
/tune/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tune/Meta-Llama-3-8B-Instruct/
-
true
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
-
true
-
-
cuda
-
-
-
-
-
-
fp32
-
true
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
32
-
-
-
torchtune.training.FullModelHFCheckpointer
/tune/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tune/Meta-Llama-3-8B-Instruct/
-
false
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
-
true
-
-
cuda
-
-
-
-
-
-
fp32
-
true
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
32
-
-
-
torchtune.training.FullModelHFCheckpointer
/tune/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tune/Meta-Llama-3-8B-Instruct/
-
true
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
-
true
-
-
cuda
-
-
-
-
-
-
fp32
-
true
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
64
-
-
-
torchtune.training.FullModelHFCheckpointer
/tune/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tune/Meta-Llama-3-8B-Instruct/
-
true
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
-
true
-
-
cuda
-
-
-
-
-
-
bf16
-
true
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
64
-
-
-
torchtune.training.FullModelHFCheckpointer
/tune/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tune/Meta-Llama-3-8B-Instruct/
-
true
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
-
true
-
-
cuda
-
-
-
-
-
-
bf16
-
true
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
1
-
-
-
torchtune.training.FullModelHFCheckpointer
/tune/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tune/Meta-Llama-3-8B-Instruct/
-
true
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
-
true
-
-
cuda
-
-
-
-
-
-
bf16
-
true
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
1
-
-
-
torchtune.training.FullModelHFCheckpointer
/tune/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tune/Meta-Llama-3-8B-Instruct/
-
true
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
-
true
-
-
cuda
-
-
-
-
-
-
bf16
-
true
-
-
1
-
-
-
-
-
meta-llama/Meta-Llama-3-8B-Instruct
true
false
true
false
0.9
0.999
1.0000e-8
false
["LlamaForCausalLM"]
false
0
false
-
true
false
128000
-
-
-
-
-
0
-
false
0
false
true
-
-
-
1800
[]
-
false
0
false
false
false
false
-
false
-
0
128009
-
0
no
false
auto
false
meta-llama/Meta-Llama-3-8B-Instruct
true
false
true
false
0.9
0.999
1.0000e-8
false
["LlamaForCausalLM"]
false
0
false
-
true
false
128000
-
-
-
-
-
0
-
false
0
false
true
-
-
-
1800
[]
-
false
0
false
false
false
false
-
false
-
0
128009
-
0
no
false
auto
false
meta-llama/Meta-Llama-3-8B-Instruct
true
false
true
false
0.9
0.999
1.0000e-8
false
["LlamaForCausalLM"]
false
0
false
-
true
false
128000
-
-
-
-
-
0
-
false
0
false
true
-
-
-
1800
[]
-
false
0
false
false
false
false
-
false
-
0
128009
-
0
no
false
auto
false
-
-
-
-
-
-
-
-
-
-
-
-
-
1
-
-
-
torchtune.utils.FullModelHFCheckpointer
/models/llm/hf/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tmp/Meta-Llama-3-8B-Instruct/
-
true
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
2048
true
-
-
cuda
-
-
-
-
-
-
bf16
-
true
-
-
1
-
-
-
-
-
meta-llama/Meta-Llama-3-8B-Instruct
true
false
true
false
0.9
0.999
1.0000e-8
false
["LlamaForCausalLM"]
false
0
false
-
true
false
128000
-
-
-
-
-
0
-
true
0
false
true
-
-
-
1800
[]
-
false
0
true
false
false
false
-
false
-
0
128009
-
0
epoch
false
auto
false
-
-
-
-
-
-
-
-
-
-
-
-
-
1
-
-
-
torchtune.utils.FullModelHFCheckpointer
/models/llm/hf/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tmp/Meta-Llama-3-8B-Instruct/
-
true
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
2048
true
-
-
cuda
-
-
-
-
-
-
bf16
-
true
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
1
-
-
-
torchtune.utils.FullModelHFCheckpointer
/models/llm/hf/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tmp/Meta-Llama-3-8B-Instruct/
-
false
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
2048
true
-
-
cuda
-
-
-
-
-
-
bf16
-
true
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
1
-
-
-
torchtune.utils.FullModelMetaCheckpointer
/models/llm/hf/Meta-Llama-3-8B-Instruct/original/
["consolidated.00.pth"]
LLAMA3
/tmp/Meta-Llama-3-8B-Instruct/
-
true
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
2048
true
-
-
cuda
-
-
-
-
-
-
bf16
-
true
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
4
-
-
-
torchtune.utils.FullModelHFCheckpointer
/models/llm/hf/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tmp/Meta-Llama-3-8B-Instruct/
-
false
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
2048
true
-
-
cuda
-
-
-
-
-
-
bf16
-
true
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
1
-
-
-
torchtune.utils.FullModelMetaCheckpointer
/models/llm/hf/Meta-Llama-3-8B-Instruct/original/
["consolidated.00.pth"]
LLAMA3
/tmp/Meta-Llama-3-8B-Instruct/
-
false
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
2048
true
-
-
cuda
-
-
-
-
-
-
bf16
-
true
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
1
-
-
-
torchtune.utils.FullModelMetaCheckpointer
/models/llm/hf/Meta-Llama-3-8B-Instruct/original/
["consolidated.00.pth"]
LLAMA3
/tmp/Meta-Llama-3-8B-Instruct/
-
true
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
2048
true
-
-
cuda
-
-
-
-
-
-
bf16
-
true
-
-
1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2
-
-
-
torchtune.utils.FullModelHFCheckpointer
/models/llm/hf/Meta-Llama-3-8B-Instruct/
["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"]
LLAMA3
/tmp/Meta-Llama-3-8B-Instruct/
-
false
-
-
-
-
torchtune.datasets.alpaca_cleaned_dataset
2048
true
-
-
cuda
-
-
-
-
-
-
bf16
-
true
-
-
1
-
-
-
-
-
1-20
of 23