qwen2-1.5b-lora-distributed Table

Ebs's workspace

Runs

Finished

ebs

10mo ago

1m 20s

torchtune.training.FullModelHFCheckpointer

/tmp/Qwen2-1.5B-Instruct

["model.safetensors"]

QWEN2

/tmp/Qwen2-1.5B-Instruct-lora-finetune

torchtune.datasets.alpaca_cleaned_dataset

cuda

bf16

true

torchtune.modules.loss.CEWithChunkedOutputLoss

torchtune.training.lr_schedulers.get_cosine_schedule_with_warmup

100

torchtune.training.metric_logging.WandBLogger

/tmp/Qwen2-1.5B-Instruct-lora-finetune

baseline-bsz16-ga1

qwen2-1.5b-lora-distributed

torchtune.models.qwen2.lora_qwen2_1_5b

false

["q_proj","v_proj"]

torch.optim.AdamW

true

0.00002

/tmp/Qwen2-1.5B-Instruct-lora-finetune

torchtune.training.setup_torch_profiler

true

false

/tmp/Qwen2-1.5B-Instruct-lora-finetune/profiling_outputs

false

true

false

Finished

ebs

10mo ago

8m 33s

torchtune.training.FullModelHFCheckpointer

/tmp/Qwen2-1.5B-Instruct

["model.safetensors"]

QWEN2

/tmp/Qwen2-1.5B-Instruct-lora-finetune

torchtune.datasets.alpaca_cleaned_dataset

cuda

bf16

true

torchtune.modules.loss.CEWithChunkedOutputLoss

torchtune.training.lr_schedulers.get_cosine_schedule_with_warmup

100

torchtune.training.metric_logging.WandBLogger

/tmp/Qwen2-1.5B-Instruct-lora-finetune

baseline-bsz1-ga16

qwen2-1.5b-lora-distributed

torchtune.models.qwen2.lora_qwen2_1_5b

false

["q_proj","v_proj"]

torch.optim.AdamW

true

0.00002

/tmp/Qwen2-1.5B-Instruct-lora-finetune

torchtune.training.setup_torch_profiler

true

false

/tmp/Qwen2-1.5B-Instruct-lora-finetune/profiling_outputs

false

true

false

Finished

ebs

10mo ago

1m 21s

torchtune.training.FullModelHFCheckpointer

/tmp/Qwen2-1.5B-Instruct

["model.safetensors"]

QWEN2

/tmp/Qwen2-1.5B-Instruct-lora-finetune

torchtune.datasets.alpaca_cleaned_dataset

cuda

bf16

true

torchtune.modules.loss.CEWithChunkedOutputLoss

torchtune.training.lr_schedulers.get_cosine_schedule_with_warmup

100

torchtune.training.metric_logging.WandBLogger

/tmp/Qwen2-1.5B-Instruct-lora-finetune

new-bsz16-ga1

qwen2-1.5b-lora-distributed

torchtune.models.qwen2.lora_qwen2_1_5b

false

["q_proj","v_proj"]

torch.optim.AdamW

true

0.00002

/tmp/Qwen2-1.5B-Instruct-lora-finetune

torchtune.training.setup_torch_profiler

true

false

/tmp/Qwen2-1.5B-Instruct-lora-finetune/profiling_outputs

false

true

false

Finished

ebs

10mo ago

8m 34s

torchtune.training.FullModelHFCheckpointer

/tmp/Qwen2-1.5B-Instruct

["model.safetensors"]

QWEN2

/tmp/Qwen2-1.5B-Instruct-lora-finetune

torchtune.datasets.alpaca_cleaned_dataset

cuda

bf16

true

torchtune.modules.loss.CEWithChunkedOutputLoss

torchtune.training.lr_schedulers.get_cosine_schedule_with_warmup

100

torchtune.training.metric_logging.WandBLogger

/tmp/Qwen2-1.5B-Instruct-lora-finetune

new-bsz1-ga16

qwen2-1.5b-lora-distributed

torchtune.models.qwen2.lora_qwen2_1_5b

false

["q_proj","v_proj"]

torch.optim.AdamW

true

0.00002

/tmp/Qwen2-1.5B-Instruct-lora-finetune

torchtune.training.setup_torch_profiler

true

false

/tmp/Qwen2-1.5B-Instruct-lora-finetune/profiling_outputs

false

true

false

1-4

of 4