upup-ashton-wang-usc

Upup-ashton-wang's workspace

Runs

host_model_post_train_dataset_name

host_model_post_train_type

Finished

upup-ashton-wang

6mo ago

15d 21h 36m 17s

0.00001

500

true

["/home/omer/shangshang/project/reasoning/reasoning-sae/ckpts/models/DeepSeek-R1-Distill-Qwen-1.5B/base","/project/neiswang_1391/shangsha/reasoning/reasoning-sae/ckpts/models/DeepSeek-R1-Distill-Qwen-1.5B/base"]

true

false

true

false

0.9

0.999

1.0000e-8

false

Qwen2ForCausalLM

false

true

false

151643

<CHARS_PER_TOKEN>

false

Finished

upup-ashton-wang

6mo ago

3mo 7d 20h 42m 38s

DeepSeek-R1-Distill-Qwen-1.5B

["checkpoint-0","checkpoint-1000","checkpoint-2000"]

["curated_deepscaler","curated_still"]

grpo

0.000001

128

0.05

["down_proj","gate_proj","k_proj","o_proj","q_proj","up_proj","v_proj"]

["layers.12.mlp","model.layers.12"]

sae-DeepSeek-R1-Distill-Qwen-1.5B-65k

500

2.11111

sft_r1_distill

DeepSeek-R1-Distill-Qwen-1.5B

Finished

upup-ashton-wang

5mo ago

12h 17m 17s

DeepSeek-R1-Distill-Qwen-1.5B

["checkpoint-1","checkpoint-10","checkpoint-100","checkpoint-50"]

curated_still

grpo

0.000001

128

0.05

["down_proj","gate_proj","k_proj","o_proj","q_proj","up_proj","v_proj"]

model.layers.12

sae-DeepSeek-R1-Distill-Qwen-1.5B-65k

500

sft_r1_distill

DeepSeek-R1-Distill-Qwen-1.5B

Finished

upup-ashton-wang

5mo ago

10d 15h 43m 6s

DeepSeek-R1-Distill-Qwen-1.5B

checkpoint-2000

curated_still

grpo

0.000001

128

0.05

["down_proj","gate_proj","k_proj","o_proj","q_proj","up_proj","v_proj"]

model.layers.12

sae-DeepSeek-R1-Distill-Qwen-1.5B-65k

500

sft_r1_distill

DeepSeek-R1-Distill-Qwen-1.5B

Finished

upup-ashton-wang

5mo ago

7h 38m 7s

DeepSeek-R1-Distill-Qwen-1.5B

["checkpoint-1","checkpoint-10","checkpoint-100","checkpoint-3000","checkpoint-50","checkpoint-500"]

curated_still

grpo

0.000001

128

0.05

["down_proj","gate_proj","k_proj","o_proj","q_proj","up_proj","v_proj"]

model.layers.12

sae-DeepSeek-R1-Distill-Qwen-1.5B-65k

500

sft_r1_distill

DeepSeek-R1-Distill-Qwen-1.5B

Finished

upup-ashton-wang

6mo ago

1d 12h 20m 2s

DeepSeek-R1-Distill-Qwen-1.5B

checkpoint-2000

curated_still

grpo

0.000001

128

0.05

["down_proj","gate_proj","k_proj","o_proj","q_proj","up_proj","v_proj"]

["model.layers.16","model.layers.17","model.layers.18","model.layers.20","model.layers.21","model.layers.22","model.layers.23","model.layers.24","model.layers.25","model.layers.26"]

sae-DeepSeek-R1-Distill-Qwen-1.5B-65k

500

2.08696

false

Qwen2.5-Math-1.5B

sft_r1_distill

DeepSeek-R1-Distill-Qwen-1.5B

1-6

of 6