Aurick-qiao's workspace
Runs
15
Name
15 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
activation_checkpointing
batch_size
datasets
debug
do_first_eval
eval_batch_size
eval_every
exp_name
fsdp_port
gradient_accumulation_steps
local_dirs
local_run_dir
loss.beta
loss.label_smoothing
loss.name
loss.reference_free
lr
max_grad_norm
max_length
max_prompt_length
minimum_log_interval_secs
model.archive
model.block_name
model.fsdp_policy_mp
model.name_or_path
model.policy_dtype
model.reference_dtype
n_epochs
n_eval_examples
n_eval_model_samples
optimizer
sample_during_eval
seed
trainer
wandb.enabled
wandb.project
warmup_steps
counters/examples
counters/updates
examples_per_second
grad_norm
logps_eval/chosen
logps_eval/rejected
logps_train/chosen
Finished
suqi-sun
3m 24s
-
false
32
["saferlhf"]
false
true
32
20000
saferlhf_dpo_ambersafe
51833
4
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/saferlhf_dpo_ambersafe_2024-01-31_23-17-32_355810
0.1
0
dpo
false
5.0000e-7
10
512
256
1
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-08_06-28-10_274941/LATEST/policy.pt
LlamaDecoderLayer
-
LLM360/AmberChat
float32
float16
3
256
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
1856
58
13.19972
26.05647
-123.636
-134.73872
-136.0524
Finished
suqi-sun
2m 33s
-
false
32
["saferlhf"]
false
true
32
20000
saferlhf_dpo_ambersafe
40233
4
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/saferlhf_dpo_ambersafe_2024-01-31_01-39-33_221995
0.1
0
dpo
false
5.0000e-7
10
512
256
1
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-08_06-28-10_274941/LATEST/policy.pt
LlamaDecoderLayer
-
LLM360/AmberChat
float32
float16
3
256
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
352
11
10.08821
32.88856
-123.636
-134.73872
-144.4724
Finished
suqi-sun
2m 11s
-
false
64
["saferlhf"]
false
true
32
19968
saferlhf_sft_ambersafe
51265
2
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/saferlhf_sft_ambersafe_2024-01-31_00-52-22_518363
-
-
sft
-
2.0000e-7
10
512
256
1
-
LlamaDecoderLayer
-
LLM360/AmberChat
float32
float16
3
256
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
960
15
54.35141
327.25186
-124.32336
-
-113.505
Finished
suqi-sun
21h 41m 38s
-
false
32
["ulfb_dpo"]
false
true
32
20000
amber359-2k-evol-mix-233k-ulfb-dpo
58779
4
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-dpo_2023-12-08_20-04-58_870360
0.1
0
dpo
false
5.0000e-7
10
1536
768
1
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-08_06-28-10_274941/LATEST/policy.pt
LlamaDecoderLayer
bfloat16
/rampart-stor/model_weights/amber359-2k-evol-mix-233k/
float32
float16
3
2000
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
185856
5808
6.21776
8.83049
-349.04157
-318.20288
-288.32376
Finished
suqi-sun
8h 56m 20s
-
false
64
["ulfb_sft"]
false
true
32
19968
amber359-2k-evol-mix-233k-ulfb-sft
58545
8
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-08_06-28-10_274941
-
-
sft
-
5.0000e-7
10
2048
1024
1
-
LlamaDecoderLayer
-
/rampart-stor/model_weights/amber359-2k-evol-mix-233k/
float32
float16
3
1000
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
185664
2901
7.27829
301.71808
-276.14359
-
-258.00789
Finished
suqi-sun
5h 55m 56s
-
false
32
["ulfb_dpo"]
false
true
32
20000
amber359-2k-evol-mix-233k-ulfb-dpo
37081
4
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-dpo_2023-12-08_00-22-45_248708
0.1
0
dpo
false
5.0000e-7
10
1536
768
1
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-06_09-34-40_083052/step-59904/policy.pt
LlamaDecoderLayer
bfloat16
/rampart-stor/model_weights/amber359-2k-evol-mix-233k/
float32
float16
3
2000
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
50784
1587
1.69593
8.91695
-332.70033
-279.80697
-142.61129
Finished
suqi-sun
24m 55s
-
false
32
["ulfb_dpo"]
false
true
32
20000
amber359-2k-evol-mix-233k-ulfb-dpo
35925
4
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-dpo_2023-12-07_23-54-11_980948
0.1
0
dpo
false
5.0000e-7
10
1536
768
1
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-06_09-34-40_083052/step-59904/policy.pt
LlamaDecoderLayer
-
/rampart-stor/model_weights/amber359-2k-evol-mix-233k/
float32
float16
3
2000
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
960
30
0.60119
24.41378
-289.35864
-232.36592
-257.08854
Finished
suqi-sun
22h 6m 45s
-
false
32
["ulfb_dpo"]
false
true
32
20000
amber359-2k-evol-mix-233k-ulfb-dpo
53965
4
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-dpo_2023-12-06_21-24-02_765747
0.1
0
dpo
false
0.00002
10
1536
768
1
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-06_09-34-40_083052/step-59904/policy.pt
LlamaDecoderLayer
bfloat16
/rampart-stor/model_weights/amber359-2k-evol-mix-233k/
float32
float16
3
2000
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
185856
5808
6.118
39.0409
-699.73372
-718.51166
-518.69936
Failed
suqi-sun
9m 31s
-
false
32
["ulfb_dpo"]
false
true
32
20000
amber359-2k-evol-mix-233k-ulfb-dpo
34411
4
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-dpo_2023-12-06_21-06-33_105803
0.1
0
dpo
false
0.00002
10
2048
1024
1
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-06_09-34-40_083052/step-59904/policy.pt
LlamaDecoderLayer
bfloat16
/rampart-stor/model_weights/amber359-2k-evol-mix-233k/
float32
float16
3
2000
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
608
19
5.12719
24.1697
-291.85681
-234.70524
-258.19247
Crashed
suqi-sun
11m 7s
-
false
32
["ulfb_dpo"]
false
true
32
20000
amber359-2k-evol-mix-233k-ulfb-dpo
57663
4
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-dpo_2023-12-06_20-44-04_217913
0.1
0
dpo
false
0.00002
10
2048
1024
1
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-06_09-34-40_083052/step-59904/policy.pt
LlamaDecoderLayer
-
/rampart-stor/model_weights/amber359-2k-evol-mix-233k/
float32
float16
3
2000
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
256
8
0.95994
21.62825
-288.85763
-232.41629
-311.7993
Finished
suqi-sun
9h 33m 54s
-
false
64
["ulfb_sft"]
false
true
32
19968
amber359-2k-evol-mix-233k-ulfb-sft
57267
8
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-06_09-34-40_083052
-
-
sft
-
0.00002
10
2048
1024
1
-
LlamaDecoderLayer
-
/rampart-stor/model_weights/amber359-2k-evol-mix-233k/
float32
float16
3
1000
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
185664
2901
7.87039
315.87082
-365.72541
-
-100.85411
Failed
suqi-sun
47m 21s
-
false
64
["ulfb_sft"]
false
true
32
19968
amber359-2k-evol-mix-233k-ulfb-sft
47715
8
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-06_07-35-18_878474
-
-
sft
-
0.00002
10
2048
1024
1
-
LlamaDecoderLayer
-
/rampart-stor/model_weights/amber359-2k-evol-mix-233k/
float32
float16
3
1000
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
18752
293
6.68582
339.73132
-315.07494
-
-314.75331
Finished
suqi-sun
6m 8s
-
false
64
["ulfb_sft"]
false
true
32
19968
amber359-2k-evol-mix-233k-ulfb-sft
51313
8
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-06_07-27-17_721754
-
-
sft
-
2.0000e-7
10
2048
1024
1
-
LlamaDecoderLayer
-
/rampart-stor/model_weights/amber359-2k-evol-mix-233k/
float32
float16
3
1000
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
1664
26
6.60042
742.97821
-315.07494
-
-287.33608
Finished
suqi-sun
1m 28s
-
false
64
["ulfb_sft"]
false
true
32
19968
amber359-2k-evol-mix-233k-ulfb-sft
41963
8
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-06_07-23-36_822278
-
-
sft
-
2.0000e-7
10
2048
1024
1
-
LlamaDecoderLayer
-
/rampart-stor/model_weights/amber359-2k-evol-mix-233k/
float32
float16
3
256
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
192
3
7.8863
806.10657
-332.94446
-
-298.93626
Failed
suqi-sun
1m 53s
-
false
64
["ulfb_sft"]
false
true
32
19968
amber359-2k-evol-mix-233k-ulfb-sft
44591
2
["/scr-ssd","/scr","/rampart-stor/suqi/.cache"]
/rampart-stor/suqi/.cache/suqi.sun/amber359-2k-evol-mix-233k-ulfb-sft_2023-12-06_06-53-54_758780
-
-
sft
-
2.0000e-7
10
2048
1024
1
-
LlamaDecoderLayer
-
/rampart-stor/model_weights/amber359-2k-evol-mix-233k/
float32
float16
3
256
16
RMSprop
false
0
FSDPTrainer
true
direct-preference-optimization
150
-
-
-
-
-332.94446
-
-
1-15
of 15