torchtune_codellama_testing Table

Salman-mohammadi's workspace

Runs

gpu_resources

loss

peak_memory_active

Finished

salman-mohammadi

1y ago

1m 16s

torchtune.utils.FullModelHFCheckpointer

/tmp/CodeLlama-7b-hf

["pytorch_model-00001-of-00003.bin","pytorch_model-00002-of-00003.bin","pytorch_model-00003-of-00003.bin"]

LLAMA2

/tmp/CodeLlama-7b-hf

false

torchtune.datasets.alpaca_cleaned_dataset

true

cuda

bf16

true

torch.nn.CrossEntropyLoss

torchtune.modules.get_cosine_schedule_with_warmup

100

torchtune.utils.metric_logging.WandBLogger

/tmp/qlora_code_llama2_finetune_output/torchtune_perf_tracing.json

torchtune_codellama_testing

torchtune.models.code_llama2.qlora_code_llama2_7b

false

["q_proj","v_proj"]

torch.optim.AdamW

0.0003

0.01

true

/tmp/qlora_code_llama2_finetune_output

torchtune.utils.profiler

false

/tmp/qlora_code_llama2_finetune_output/torchtune_perf_tracing.json

false

true

torchtune.models.llama2.llama2_tokenizer

/tmp/CodeLlama-7b-hf/tokenizer.model

12647949824

1.53467

12.85234

Finished

salman-mohammadi

1y ago

torchtune.utils.FullModelHFCheckpointer

/tmp/Llama-2-7b-hf

["pytorch_model-00001-of-00002.bin","pytorch_model-00002-of-00002.bin"]

LLAMA2

/tmp/Llama-2-7b-hf

false

torchtune.datasets.alpaca_cleaned_dataset

true

cuda

bf16

true

torch.nn.CrossEntropyLoss

torchtune.modules.get_cosine_schedule_with_warmup

100

torchtune.utils.metric_logging.WandBLogger

/tmp/qlora_finetune_output/

torchtune_codellama_testing

torchtune.models.llama2.qlora_llama2_7b

true

false

["q_proj","v_proj","k_proj","output_proj"]

torch.optim.AdamW

0.0003

0.01

/tmp/qlora_finetune_output/

torchtune.utils.profiler

false

/tmp/qlora_finetune_output//torchtune_perf_tracing.json

false

true

torchtune.models.llama2.llama2_tokenizer

/tmp/Llama-2-7b-hf/tokenizer.model

Finished

salman-mohammadi

1y ago

50s

torchtune.utils.FullModelHFCheckpointer

/tmp/CodeLlama-7b-hf

["pytorch_model-00001-of-00003.bin","pytorch_model-00002-of-00003.bin","pytorch_model-00003-of-00003.bin"]

LLAMA2

/tmp/CodeLlama-7b-hf

false

torchtune.datasets.alpaca_cleaned_dataset

true

cuda

bf16

true

torch.nn.CrossEntropyLoss

torchtune.modules.get_cosine_schedule_with_warmup

100

torchtune.utils.metric_logging.WandBLogger

/tmp/lora_code_llama2_finetune_output/torchtune_perf_tracing.json

torchtune_codellama_testing

torchtune.models.code_llama2.lora_code_llama2_7b

false

["q_proj","v_proj"]

torch.optim.AdamW

0.0003

0.01

true

/tmp/lora_code_llama2_finetune_output

torchtune.utils.profiler

false

/tmp/lora_code_llama2_finetune_output/torchtune_perf_tracing.json

false

true

torchtune.models.llama2.llama2_tokenizer

/tmp/CodeLlama-7b-hf/tokenizer.model

14211938816

1.62569

14.13296

Finished

salman-mohammadi

1y ago

52s

torchtune.utils.FullModelHFCheckpointer

/tmp/CodeLlama-7b-hf

["pytorch_model-00001-of-00003.bin","pytorch_model-00002-of-00003.bin","pytorch_model-00003-of-00003.bin"]

LLAMA2

/tmp/CodeLlama-7b-hf

false

torchtune.datasets.alpaca_cleaned_dataset

true

cuda

bf16

true

torch.nn.CrossEntropyLoss

torchtune.modules.get_cosine_schedule_with_warmup

100

torchtune.utils.metric_logging.WandBLogger

/tmp/lora_code_llama2_finetune_output/torchtune_perf_tracing.json

torchtune_codellama_testing

torchtune.models.code_llama2.lora_code_llama2_7b

false

["q_proj","v_proj"]

torch.optim.AdamW

0.0003

0.01

true

/tmp/lora_code_llama2_finetune_output

false

true

torchtune.models.llama2.llama2_tokenizer

/tmp/CodeLlama-7b-hf/tokenizer.model

Finished

salman-mohammadi

1y ago

15s

torchtune.utils.FullModelHFCheckpointer

/tmp/CodeLlama-7b-hf

["pytorch_model-00001-of-00003.bin","pytorch_model-00002-of-00003.bin","pytorch_model-00003-of-00003.bin"]

LLAMA2

/tmp/CodeLlama-7b-hf

false

torchtune.datasets.alpaca_cleaned_dataset

true

cuda

bf16

true

torch.nn.CrossEntropyLoss

torchtune.modules.get_cosine_schedule_with_warmup

100

torchtune.utils.metric_logging.WandBLogger

/tmp/lora_code_llama2_finetune_output/torchtune_perf_tracing.json

torchtune_codellama_testing

torchtune.models.lora_code_llama2.code_llama2_7b

false

["q_proj","v_proj"]

torch.optim.AdamW

0.0003

0.01

true

/tmp/lora_code_llama2_finetune_output

false

true

torchtune.models.llama2.llama2_tokenizer

/tmp/CodeLlama-7b-hf/tokenizer.model

Finished

salman-mohammadi

1y ago

2m 32s

torchtune.utils.FullModelHFCheckpointer

/tmp/CodeLlama-7b-hf

["pytorch_model-00001-of-00003.bin","pytorch_model-00002-of-00003.bin","pytorch_model-00003-of-00003.bin"]

LLAMA2

/tmp/CodeLlama-7b-hf

false

torchtune.datasets.alpaca_dataset

true

cuda

bf16

true

torch.nn.CrossEntropyLoss

torchtune.utils.metric_logging.WandBLogger

/tmp/code_llama2_finetune

torchtune_codellama_testing

torchtune.models.code_llama2.code_llama2_7b

bitsandbytes.optim.PagedAdamW

0.00002

true

/tmp/code_llama2_finetune

false

true

torchtune.models.llama2.llama2_tokenizer

/tmp/CodeLlama-7b-hf/tokenizer.model

13902832640

1.24063

0.00002

Finished

salman-mohammadi

1y ago

torchtune.utils.FullModelHFCheckpointer

/tmp/CodeLlama-7b-hf

["pytorch_model-00001-of-00003.bin","pytorch_model-00002-of-00003.bin","pytorch_model-00003-of-00003.bin"]

LLAMA2

/tmp/CodeLlama-7b-hf

false

torchtune.datasets.alpaca_dataset

true

cuda

bf16

true

torch.nn.CrossEntropyLoss

torchtune.utils.metric_logging.WandBLogger

/tmp/code_llama2_finetune

torchtune_codellama_testing

torchtune.models.code_llama2.code_llama2_7b

bitsandbytes.optim.PagedAdamW

0.00002

true

/tmp/code_llama2_finetune

false

true

torchtune.models.llama2.llama2_tokenizer

/tmp/CodeLlama-7b-hf/tokenizer.model

Finished

salman-mohammadi

1y ago

41m 41s

torchtune.utils.FullModelHFCheckpointer

/tmp/CodeLlama-7b-Instruct-hf

["pytorch_model-00001-of-00003.bin","pytorch_model-00002-of-00003.bin","pytorch_model-00003-of-00003.bin"]

LLAMA2

/tmp/Llama-2-7b-hf

false

torchtune.datasets.alpaca_cleaned_dataset

true

cuda

bf16

true

torch.nn.CrossEntropyLoss

torchtune.modules.get_cosine_schedule_with_warmup

100

torchtune.utils.metric_logging.WandBLogger

/tmp/lora_finetune_output

torchtune_codellama_testing

torchtune.models.llama2.lora_code_llama2_7b

false

["q_proj","v_proj"]

torch.optim.AdamW

0.0003

0.01

/tmp/lora_finetune_output

torchtune.utils.profiler

false

/tmp/lora_finetune_output/torchtune_perf_tracing.json

false

true

torchtune.models.llama2.llama2_tokenizer

/tmp/CodeLlama-7b-Instruct-hf/tokenizer.model

13919330304

1.41144

0.000165

14.58847

Finished

salman-mohammadi

1y ago

58m 11s

torchtune.utils.FullModelHFCheckpointer

/tmp/CodeLlama-13b-Instruct-hf

["pytorch_model-00001-of-00003.bin","pytorch_model-00002-of-00003.bin","pytorch_model-00003-of-00003.bin"]

LLAMA2

/tmp/Llama-2-13b-hf/

false

torchtune.datasets.alpaca_cleaned_dataset

true

cuda

bf16

true

torch.nn.CrossEntropyLoss

torchtune.modules.get_cosine_schedule_with_warmup

100

torchtune.utils.metric_logging.WandBLogger

/tmp/qlora_finetune_output/

torchtune_codellama_testing

torchtune.models.llama2.qlora_code_llama2_13b

true

false

["q_proj","v_proj","k_proj","output_proj"]

torch.optim.AdamW

0.0003

0.01

/tmp/qlora_finetune_output/

torchtune.utils.profiler

false

/tmp/qlora_finetune_output//torchtune_perf_tracing.json

false

true

torchtune.models.llama2.llama2_tokenizer

/tmp/CodeLlama-13b-Instruct-hf/tokenizer.model

8594478080

1.29708

0.000093

9.45774

Finished

salman-mohammadi

1y ago

24m 4s

torchtune.utils.FullModelHFCheckpointer

/tmp/CodeLlama-7b-Instruct-hf

["pytorch_model-00001-of-00003.bin","pytorch_model-00002-of-00003.bin","pytorch_model-00003-of-00003.bin"]

LLAMA2

/tmp/Llama-2-7b-hf

false

torchtune.datasets.alpaca_dataset

true

cuda

bf16

true

torch.nn.CrossEntropyLoss

torchtune.utils.metric_logging.WandBLogger

/tmp/alpaca-llama2-finetune

torchtune_codellama_testing

torchtune.models.llama2.code_llama2_7b

bitsandbytes.optim.PagedAdamW

0.00002

true

/tmp/alpaca-llama2-finetune

false

true

torchtune.models.llama2.llama2_tokenizer

/tmp/CodeLlama-7b-Instruct-hf/tokenizer.model

14020930048

1.31372

0.00002

14.44884

1-10

of 10