Randomfoo's workspace
Runs 
38
Name
0 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
adam_betas
adam_offload
apply_chat_template
aux_loss_coef
beta
bf16
chosen_key
ckpt_path
dataset
dataset_probs
dataset_split
deepcompile
disable_ds_ckpt
disable_fast_tokenizer
ds_tensor_parallel_size
eval_split
eval_steps
flash_attn
full_determinism
gradient_checkpointing
gradient_checkpointing_use_reentrant
ipo
l2
label_smoothing
learning_rate
load_checkpoint
load_in_4bit
local_rank
logging_steps
lora_alpha
lora_dropout
lora_rank
lr_warmup_ratio
max_ckpt_mem
max_ckpt_num
max_epochs
max_len
max_norm
max_samples
micro_train_batch_size
nll_loss_coef
overlap_comm
packing_samples
pretrain
Finished
-
randomfoo
12h 58m 24s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
1.0000e-7
false
false
-1
1
16
0
0
0.05
100000000
1
1
1024
1
1000000
1
0
true
true
/fsx2/global_step4500_hf
Finished
-
randomfoo
12h 38m 23s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
4.0000e-8
false
false
-1
1
16
0
0
0.05
100000000
1
1
1024
1
1000000
1
0
true
true
/fsx2/global_step4500_hf
Finished
-
randomfoo
46m 11s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
2.8900e-7
false
false
-1
1
16
0
0
0.05
100000000
3
1
2048
1
1000000
4
0
true
true
shisa-ai/ablation-195-finalsft2-shisa-v2-mistral-small-24b
Finished
-
randomfoo
12h 54m 53s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
7.0000e-8
false
false
-1
1
16
0
0
0.05
100000000
3
1
1024
1
1000000
1
0
true
true
/fsx2/global_step4500_hf
Crashed
-
randomfoo
19m 16s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
6.6400e-8
false
false
-1
1
16
0
0
0.05
100000000
3
1
1024
1
1000000
1
0
true
true
/fsx2/checkpoints/global_step6000_hf
Failed
-
randomfoo
31s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
5.0000e-7
false
false
-1
1
512
0.05
256
0.05
100000000
3
1
4096
1
1000000
1
0
true
true
/fsx2/checkpoints/global_step6000_hf
Crashed
-
randomfoo
45m 16s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
6.6400e-8
false
false
-1
1
16
0
0
0.05
100000000
3
1
512
1
1000000
1
0
true
true
/fsx2/checkpoints/global_step6000_hf
Crashed
-
randomfoo
5h 6m 46s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
6.6400e-8
false
false
-1
1
16
0
0
0.05
100000000
3
1
1024
1
1000000
1
0
true
true
/fsx2/checkpoints/global_step6000_hf
Crashed
-
randomfoo
3m 16s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
6.6400e-8
false
false
-1
1
16
0
0
0.05
100000000
3
1
1536
1
1000000
1
0
true
true
/fsx2/checkpoints/global_step6000_hf
Finished
-
randomfoo
1h 44m 37s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
8.0000e-8
false
false
-1
1
16
0
0
0.05
100000000
3
1
2048
1
1000000
8
0
true
true
/fsx2/outputs/ablation-163-shisav2.if50-shisa-v2-llama-3.1-8b
Finished
-
randomfoo
1h 47m 58s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
5.0000e-7
false
false
-1
1
16
0
0
0.05
100000000
3
1
2048
1
1000000
8
0
true
true
/fsx2/outputs/ablation-163-shisav2.if50-shisa-v2-llama-3.1-8b
Finished
-
randomfoo
1h 45m 25s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
2.0000e-7
false
false
-1
1
16
0
0
0.05
100000000
3
1
2048
1
1000000
8
0
true
true
/fsx2/outputs/ablation-163-shisav2.if50-shisa-v2-llama-3.1-8b
Finished
-
randomfoo
1h 47m 13s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
3.0000e-7
false
false
-1
1
16
0
0
0.05
100000000
3
1
2048
1
1000000
8
0
true
true
/fsx2/outputs/ablation-163-shisav2.if50-shisa-v2-llama-3.1-8b
Finished
-
randomfoo
1h 43m 13s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
5.0000e-8
false
false
-1
1
16
0
0
0.05
100000000
3
1
2048
1
1000000
8
0
true
true
/fsx2/outputs/ablation-163-shisav2.if50-shisa-v2-llama-3.1-8b
Finished
-
randomfoo
1h 48m 10s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
8.0000e-7
false
false
-1
1
16
0
0
0.05
100000000
3
1
2048
1
1000000
8
0
true
true
/fsx2/outputs/ablation-163-shisav2.if50-shisa-v2-llama-3.1-8b
Finished
-
randomfoo
1h 46m 38s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
1.0000e-7
false
false
-1
1
16
0
0
0.05
100000000
3
1
2048
1
1000000
8
0
true
true
/fsx2/outputs/ablation-163-shisav2.if50-shisa-v2-llama-3.1-8b
Finished
-
randomfoo
1h 20m 28s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
3.0000e-7
false
false
-1
1
16
0
0
0.03
100000000
3
1
4096
1
1000000
4
0
true
true
/fsx2/outputs/ablation-179-finalsft2-shisa-v2-unphi-4-14b
Finished
-
randomfoo
2h 32m 32s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
2.0000e-7
false
false
-1
1
16
0
0
0.05
100000000
3
1
4096
1
1000000
4
0
true
true
/fsx2/outputs/ablation-180-finalsft2-shisa-v2-llama-3.3-70b
Finished
-
randomfoo
1h 13m 50s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
3.0000e-7
false
false
-1
1
16
0
0
0.03
100000000
3
1
4096
1
1000000
4
0
true
true
/fsx2/outputs/ablation-153-finalsft-shisa-v2-unphi-4-14b
Finished
-
randomfoo
1h 13m 51s
-
[0.9,0.95]
false
true
0
0.1
true
chosen
./ckpt/checkpoints_dpo
/fsx/ubuntu/meti/data/openrlhf/dpo.shisa-v2.jsonl
1.0
-
-
false
false
-
test
-1
true
false
true
false
false
0
0
9.0000e-7
false
false
-1
1
16
0
0
0.03
100000000
3
1
4096
1
1000000
4
0
true
true
/fsx2/outputs/ablation-153-finalsft-shisa-v2-unphi-4-14b
1-20
of 38