jcummings's workspace: Runs (2)
| Field | Run 1 | Run 2 |
|---|---|---|
| State | Killed | Killed |
| Notes | | |
| User | jcummings | jcummings |
| Tags | | |
| Created | | |
| Runtime | 2m 54s | 2m 13s |
| Sweep | - | - |
| batch_size | 2 | 2 |
| checkpointer._component_ | torchtune.training.FullModelHFCheckpointer | torchtune.training.FullModelHFCheckpointer |
| checkpointer.checkpoint_dir | /tmp/Meta-Llama-3.1-8B-Instruct/ | /tmp/Meta-Llama-3.1-8B-Instruct/ |
| checkpointer.checkpoint_files | ["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"] | ["model-00001-of-00004.safetensors","model-00002-of-00004.safetensors","model-00003-of-00004.safetensors","model-00004-of-00004.safetensors"] |
| checkpointer.model_type | LLAMA3 | LLAMA3 |
| checkpointer.output_dir | /tmp/Meta-Llama-3.1-8B-Instruct/ | /tmp/Meta-Llama-3.1-8B-Instruct/ |
| compile | false | false |
| custom_sharded_layers | - | ["tok_embeddings","output"] |
| dataset._component_ | torchtune.datasets.stack_exchange_paired_dataset | torchtune.datasets.stack_exchange_paired_dataset |
| dataset.packed | - | - |
| device | cuda | cuda |
| dtype | bf16 | bf16 |
| enable_activation_checkpointing | true | true |
| enable_activation_offloading | false | false |
| epochs | 1 | 1 |
| gradient_accumulation_steps | 8 | 8 |
| log_every_n_steps | 1 | 1 |
| log_peak_memory_stats | true | true |
| loss._component_ | torchtune.rlhf.loss.DPOLoss | torchtune.rlhf.loss.DPOLoss |
| loss.beta | 0.1 | 0.1 |
| loss.label_smoothing | 0 | 0 |
| lr_scheduler._component_ | torchtune.training.lr_schedulers.get_cosine_schedule_with_warmup | torchtune.training.lr_schedulers.get_cosine_schedule_with_warmup |
| lr_scheduler.num_warmup_steps | 100 | 100 |
| metric_logger._component_ | torchtune.training.metric_logging.WandBLogger | torchtune.training.metric_logging.WandBLogger |
| metric_logger.project | test-123-dpo | test-123-dpo |
| model._component_ | torchtune.models.llama3_1.lora_llama3_1_8b | torchtune.models.llama3_1.lora_llama3_1_8b |
| model.apply_lora_to_mlp | true | true |
| model.apply_lora_to_output | false | false |
| model.lora_alpha | 16 | 16 |
| model.lora_attn_modules | ["q_proj","v_proj","output_proj"] | ["q_proj","v_proj","output_proj"] |
| model.lora_dropout | 0 | 0 |
| model.lora_rank | 8 | 8 |
| optimizer._component_ | torch.optim.AdamW | torch.optim.AdamW |
| optimizer.fused | true | true |
| optimizer.lr | 0.0005 | 0.0005 |
| optimizer.weight_decay | 0.05 | 0.05 |
| output_dir | /tmp/lora_finetune_output | /tmp/lora_finetune_output |
| profiler._component_ | torchtune.training.setup_torch_profiler | torchtune.training.setup_torch_profiler |
| profiler.active_steps | 2 | 2 |
| profiler.cpu | true | true |
| profiler.cuda | true | true |
| profiler.enabled | false | false |
| profiler.num_cycles | 1 | 1 |
| profiler.output_dir | /tmp/lora_finetune_output/profiling_outputs | /tmp/lora_finetune_output/profiling_outputs |
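Both runs are killed torchtune LoRA DPO fine-tunes of Meta-Llama-3.1-8B-Instruct with identical configurations except for `custom_sharded_layers` (unset in Run 1, `["tok_embeddings","output"]` in Run 2). Below is a minimal sketch of how such a comparison could be pulled programmatically with the W&B public API; the entity name `jcummings` is an assumption based on the workspace owner, and the project name comes from `metric_logger.project` above.

```python
# Sketch (not verified against this workspace): diff the two runs' configs via
# the W&B public API. Entity "jcummings" is assumed; the project name is taken
# from metric_logger.project in the table above.
import wandb

api = wandb.Api()
runs = list(api.runs("jcummings/test-123-dpo"))
assert len(runs) >= 2, "expected the two killed DPO runs shown above"

run_a, run_b = runs[0], runs[1]
print(run_a.name, run_a.state, "|", run_b.name, run_b.state)

# Report every top-level config key whose value differs between the two runs.
# Note: torchtune's WandBLogger may log nested dicts (e.g. config["model"]),
# which the W&B table UI flattens into dotted column names.
for key in sorted(set(run_a.config) | set(run_b.config)):
    a_val, b_val = run_a.config.get(key), run_b.config.get(key)
    if a_val != b_val:
        print(f"{key}: {a_val!r} -> {b_val!r}")
# For the runs above, the only config difference should be custom_sharded_layers.
```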