Alexander-f-moreno's workspace
Runs
8
Name
8 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
actor_rollout_ref.actor.checkpoint.async_save
actor_rollout_ref.actor.checkpoint.contents
actor_rollout_ref.actor.checkpoint.load_contents
actor_rollout_ref.actor.checkpoint.save_contents
actor_rollout_ref.actor.clip_ratio
actor_rollout_ref.actor.clip_ratio_c
actor_rollout_ref.actor.clip_ratio_high
actor_rollout_ref.actor.clip_ratio_low
actor_rollout_ref.actor.entropy_coeff
actor_rollout_ref.actor.fsdp_config.fsdp_size
actor_rollout_ref.actor.fsdp_config.optimizer_offload
actor_rollout_ref.actor.fsdp_config.param_offload
actor_rollout_ref.actor.fsdp_config.wrap_policy.min_num_params
actor_rollout_ref.actor.grad_clip
actor_rollout_ref.actor.kl_loss_coef
actor_rollout_ref.actor.kl_loss_type
actor_rollout_ref.actor.load_weight
actor_rollout_ref.actor.loss_agg_mode
actor_rollout_ref.actor.megatron.context_parallel_size
actor_rollout_ref.actor.megatron.expert_model_parallel_size
actor_rollout_ref.actor.megatron.grad_offload
actor_rollout_ref.actor.megatron.optimizer_offload
actor_rollout_ref.actor.megatron.param_offload
actor_rollout_ref.actor.megatron.pipeline_model_parallel_size
actor_rollout_ref.actor.megatron.seed
actor_rollout_ref.actor.megatron.sequence_parallel
actor_rollout_ref.actor.megatron.tensor_model_parallel_size
actor_rollout_ref.actor.megatron.use_dist_checkpointing
actor_rollout_ref.actor.megatron.use_distributed_optimizer
actor_rollout_ref.actor.megatron.use_mbridge
actor_rollout_ref.actor.optim.clip_grad
actor_rollout_ref.actor.optim.lr
actor_rollout_ref.actor.optim.lr_decay_style
actor_rollout_ref.actor.optim.lr_warmup_init
actor_rollout_ref.actor.optim.lr_warmup_steps
actor_rollout_ref.actor.optim.lr_warmup_steps_ratio
actor_rollout_ref.actor.optim.lr_wsd_decay_style
actor_rollout_ref.actor.optim.min_lr
actor_rollout_ref.actor.optim.min_lr_ratio
actor_rollout_ref.actor.optim.optimizer
actor_rollout_ref.actor.optim.total_training_steps
actor_rollout_ref.actor.optim.use_checkpoint_opt_param_scheduler
actor_rollout_ref.actor.optim.warmup_style
actor_rollout_ref.actor.optim.weight_decay
Crashed
-
z6cheng
2d 19h 27m
-
-
["model","hf_model","optimizer","extra"]
-
-
0.2
10
0.2
0.2
0
-1
true
true
0
1
0
low_var_kl
-
token-mean
-
-
-
-
-
-
-
-
-
-
-
-
-
0.000001
-
-
10
0
-
-
0
-
1790
-
constant
0.1
Crashed
-
z6cheng
9d 6h 32m
-
-
["model","hf_model","optimizer","extra"]
-
-
0.2
10
0.28
0.2
0
-1
true
true
0
1
0
low_var_kl
-
token-mean
-
-
-
-
-
-
-
-
-
-
-
-
-
0.000001
-
-
10
0
-
-
0
-
1790
-
constant
0.1
Crashed
-
z6cheng
8h 16m 36s
-
-
["model","hf_model","optimizer","extra"]
-
-
0.2
10
0.28
0.2
0
-1
true
true
0
1
0
low_var_kl
-
token-mean
-
-
-
-
-
-
-
-
-
-
-
-
-
0.000001
-
-
10
0
-
-
0
-
1790
-
constant
0.1
Finished
-
z6cheng
2d 1h 38m 51s
-
-
["model","hf_model","optimizer","extra"]
-
-
0.2
10
0.28
0.2
0
-1
true
true
0
1
0
low_var_kl
-
token-mean
-
-
-
-
-
-
-
-
-
-
-
-
-
0.000001
-
-
10
0
-
-
0
-
1790
-
constant
0.1
Finished
-
z6cheng
6d 3h 27m 11s
-
-
["model","hf_model","optimizer","extra"]
-
-
0.2
10
0.2
0.2
0
-1
true
true
0
1
0
low_var_kl
-
token-mean
-
-
-
-
-
-
-
-
-
-
-
-
-
0.000001
-
-
10
0
-
-
0
-
1790
-
constant
0.1
Crashed
-
z6cheng
3d 23h 39m 30s
-
-
["model","hf_model","optimizer","extra"]
-
-
0.2
10
0.28
0.2
0
-1
true
true
0
1
0
low_var_kl
-
token-mean
-
-
-
-
-
-
-
-
-
-
-
-
-
0.000001
-
-
10
0
-
-
0
-
1790
-
constant
0.1
Crashed
-
leoii22
20h 40m 30s
-
-
["model","hf_model","optimizer","extra"]
-
-
0.2
10
0.2
0.2
0
-1
true
true
0
1
0
low_var_kl
-
token-mean
-
-
-
-
-
-
-
-
-
-
-
-
-
0.000001
-
-
10
0
-
-
0
-
608
-
constant
0.1
Crashed
-
leoii22
15h 42m 31s
-
-
["model","hf_model","optimizer","extra"]
-
-
0.2
10
0.2
0.2
0
-1
true
true
0
1
0
low_var_kl
-
token-mean
-
-
-
-
-
-
-
-
-
-
-
-
-
0.000001
-
-
10
0
-
-
0
-
608
-
constant
0.1
1-8
of 8