Jiayipan's workspace
Runs
11
Name
1 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
actor_rollout_ref.actor.clip_ratio
actor_rollout_ref.actor.entropy_coeff
actor_rollout_ref.actor.fsdp_config.fsdp_size
actor_rollout_ref.actor.fsdp_config.grad_offload
actor_rollout_ref.actor.fsdp_config.optimizer_offload
actor_rollout_ref.actor.fsdp_config.param_offload
actor_rollout_ref.actor.fsdp_config.wrap_policy.min_num_params
actor_rollout_ref.actor.grad_clip
actor_rollout_ref.actor.kl_loss_coef
actor_rollout_ref.actor.kl_loss_type
actor_rollout_ref.actor.optim.lr
actor_rollout_ref.actor.optim.lr_warmup_steps_ratio
actor_rollout_ref.actor.optim.total_training_steps
actor_rollout_ref.actor.optim.warmup_style
actor_rollout_ref.actor.ppo_epochs
actor_rollout_ref.actor.ppo_max_token_len_per_gpu
actor_rollout_ref.actor.ppo_micro_batch_size
actor_rollout_ref.actor.ppo_mini_batch_size
actor_rollout_ref.actor.shuffle
actor_rollout_ref.actor.strategy
actor_rollout_ref.actor.ulysses_sequence_parallel_size
actor_rollout_ref.actor.use_dynamic_bsz
actor_rollout_ref.actor.use_kl_loss
actor_rollout_ref.hybrid_engine
actor_rollout_ref.model.enable_gradient_checkpointing
actor_rollout_ref.model.path
actor_rollout_ref.model.use_remove_padding
actor_rollout_ref.ref.fsdp_config.fsdp_size
actor_rollout_ref.ref.fsdp_config.param_offload
actor_rollout_ref.ref.fsdp_config.wrap_policy.min_num_params
actor_rollout_ref.ref.log_prob_max_token_len_per_gpu
actor_rollout_ref.ref.log_prob_micro_batch_size
actor_rollout_ref.ref.log_prob_use_dynamic_bsz
actor_rollout_ref.ref.ulysses_sequence_parallel_size
actor_rollout_ref.rollout.do_sample
actor_rollout_ref.rollout.dtype
actor_rollout_ref.rollout.enforce_eager
actor_rollout_ref.rollout.free_cache_engine
actor_rollout_ref.rollout.gpu_memory_utilization
actor_rollout_ref.rollout.ignore_eos
actor_rollout_ref.rollout.load_format
actor_rollout_ref.rollout.log_prob_max_token_len_per_gpu
actor_rollout_ref.rollout.log_prob_micro_batch_size
actor_rollout_ref.rollout.log_prob_use_dynamic_bsz
Crashed
-
jiayipan
2h 40m 31s
-
0.2
0.001
-1
false
false
false
0
1
0.001
low_var_kl
0.000001
0
128000
constant
1
16384
8
128
false
fsdp
1
false
false
true
false
/data/models/Qwen2.5-3B
false
-1
false
0
16384
4
false
1
true
bfloat16
true
true
0.4
false
dummy_dtensor
16384
8
false
Crashed
-
jiayipan
1h 10m 32s
-
0.2
0.001
-1
false
false
false
0
1
0.001
low_var_kl
0.000001
0
128000
constant
1
16384
8
128
false
fsdp
1
false
false
true
false
/data/models/Qwen2.5-3B
false
-1
false
0
16384
4
false
1
true
bfloat16
true
true
0.4
false
dummy_dtensor
16384
8
false
Crashed
-
jiayipan
8h 12m 1s
-
0.2
0.001
-1
false
false
false
0
1
0.001
low_var_kl
0.000001
0
320000
constant
1
16384
8
128
false
fsdp
1
false
false
true
false
/data/models/Qwen2.5-3B
false
-1
false
0
16384
4
false
1
true
bfloat16
true
true
0.4
false
dummy_dtensor
16384
8
false
Crashed
-
jiayipan
6h 49m 32s
-
0.2
0.001
-1
false
false
false
0
1
0.001
low_var_kl
0.000001
0
64000
constant
1
16384
8
128
false
fsdp
1
false
false
true
false
/data/models/Qwen2.5-3B
false
-1
false
0
16384
4
false
1
true
bfloat16
true
true
0.4
false
dummy_dtensor
16384
8
false
Crashed
-
jiayipan
3h 2m 1s
-
0.2
0.001
-1
false
false
false
0
1
-
-
0.000001
0
19200
constant
1
-
8
128
false
fsdp
1
-
-
true
false
Qwen/Qwen2.5-1.5B
false
-1
false
0
-
4
-
1
true
bfloat16
true
true
0.4
false
dummy_dtensor
-
8
-
Crashed
-
jiayipan
2h 39m 31s
-
0.2
0.001
-1
false
false
false
0
1
-
-
0.000001
0
19200
constant
1
-
8
128
false
fsdp
1
-
-
true
false
Qwen/Qwen2.5-7B
false
-1
false
0
-
4
-
1
true
bfloat16
true
true
0.4
false
dummy_dtensor
-
8
-
Crashed
-
jiayipan
2h 21m 1s
-
0.2
0.001
-1
false
false
false
0
1
-
-
0.000001
0
19200
constant
1
-
8
128
false
fsdp
1
-
-
true
false
openlm-research/open_llama_7b_v2
false
-1
false
0
-
4
-
1
true
bfloat16
true
true
0.4
false
dummy_dtensor
-
8
-
Crashed
-
jiayipan
6h 29m
-
0.2
0.001
-1
false
false
false
0
1
-
-
0.000001
0
19200
constant
1
-
8
128
false
fsdp
1
-
-
true
false
Qwen/Qwen2.5-3B-Instruct
false
-1
false
0
-
4
-
1
true
bfloat16
true
true
0.4
false
dummy_dtensor
-
8
-
Crashed
-
jiayipan
3h 9m 1s
-
0.2
0.001
-1
false
false
false
0
1
-
-
0.000001
0
19200
constant
1
-
8
128
false
fsdp
1
-
-
true
false
Qwen/Qwen2.5-0.5B
false
-1
false
0
-
4
-
1
true
bfloat16
true
true
0.4
false
dummy_dtensor
-
8
-
Crashed
-
jiayipan
5h 43m 46s
-
0.2
0.001
-1
false
false
false
0
1
-
-
0.000001
0
19200
constant
1
-
8
128
false
fsdp
1
-
-
true
false
Qwen/Qwen2.5-1.5B
false
-1
false
0
-
4
-
1
true
bfloat16
true
true
0.4
false
dummy_dtensor
-
8
-
Crashed
-
jiayipan
4h 44m 31s
-
0.2
0.001
-1
false
false
false
0
1
-
-
0.000001
0
19200
constant
1
-
8
128
false
fsdp
1
-
-
true
false
Qwen/Qwen2.5-3B
false
-1
false
0
-
4
-
1
true
bfloat16
true
true
0.4
false
dummy_dtensor
-
8
-
1-11
of 11