Tonghezhang01's workspace
Runs
17
Name
17 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
_target_
act_steps
action_dim
base_policy_path
batch_size
cond_steps
dataset_dir
denoising_steps
device
egl_device
env.best_reward_threshold_for_success
env.max_episode_steps
env.n_envs
env.name
env.reset_at_iteration
env.save_video
env.wrappers.mujoco_locomotion_lowdim.normalization_path
env.wrappers.multi_step.max_episode_steps
env.wrappers.multi_step.n_action_steps
env.wrappers.multi_step.n_obs_steps
env.wrappers.multi_step.reset_within_step
env_name
ft_denoising_steps
horizon_steps
logdir
max_std
min_std
model._target_
model.act_dim
model.act_max
model.act_min
model.action_dim
model.actor._target_
model.actor.action_dim
model.actor.cond_dim
model.actor.cond_mlp_dims
model.actor.cond_steps
model.actor.hidden_dim
model.actor.horizon_steps
model.actor.mlp_dims
model.actor.obs_dim
model.actor.residual_style
model.actor.time_dim
model.actor_policy_path
Finished
-
tonghezhang01
1d 2h 5m 43s
-
agent.finetune.flow_baselines.train_fql_agent.TrainFQLAgent
4
9
-
256
1
/home/zhangtonghe/dppo/data/gym/kitchen-mixed-v0
4
cuda:5
cuda:5
4
280
1
kitchen-mixed-v0
false
false
/home/zhangtonghe/dppo/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
-
4
/home/zhangtonghe/dppo/log/gym/finetune/kitchen-mixed-v0_fql_mlp_ta4_td4_seed42/2025-05-25_12-39-58_42
-
-
model.flow.ft_baselines.fql.FQLModel
-
-
-
-
model.flow.ft_baselines.fql.OneStepActor
9
-
-
1
512
4
-
60
-
-
-
Finished
-
tonghezhang01
11h 24m 7s
-
agent.finetune.flow_baselines.train_fql_agent.TrainFQLAgent
4
9
-
256
1
/home/yuchao/ReinFlow/data/gym/kitchen-mixed-v0
4
cuda:5
cuda:5
4
280
1
kitchen-mixed-v0
false
false
/home/yuchao/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
-
4
/home/yuchao/ReinFlow/log/gym/finetune/kitchen-mixed-v0_fql_mlp_ta4_td4/2025-05-24_22-13-24_2025
-
-
model.flow.ft_baselines.fql.FQLModel
-
-
-
-
model.flow.ft_baselines.fql.OneStepActor
9
-
-
1
512
4
-
60
-
-
-
Finished
-
tonghezhang01
1d 3h 30m 48s
-
agent.finetune.flow_baselines.train_fql_agent.TrainFQLAgent
4
9
-
256
1
/home/yuchao/ReinFlow/data/gym/kitchen-mixed-v0
4
cuda:0
cuda:0
4
280
1
kitchen-mixed-v0
false
false
/home/yuchao/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
-
4
/home/yuchao/ReinFlow/log/gym/finetune/kitchen-mixed-v0_fql_mlp_ta4_td4_seed509/2025-05-10_21-40-09_509
-
-
model.flow.ft_baselines.fql.FQLModel
-
-
-
-
model.flow.ft_baselines.fql.OneStepActor
9
-
-
1
512
4
-
60
-
-
-
Finished
-
tonghezhang01
1d 3h 31m 45s
-
agent.finetune.flow_baselines.train_fql_agent.TrainFQLAgent
4
9
-
256
1
/home/yuchao/ReinFlow/data/gym/kitchen-mixed-v0
4
cuda:1
cuda:1
4
280
1
kitchen-mixed-v0
false
false
/home/yuchao/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
-
4
/home/yuchao/ReinFlow/log/gym/finetune/kitchen-mixed-v0_fql_mlp_ta4_td4_seed3407/2025-05-10_21-40-08_3407
-
-
model.flow.ft_baselines.fql.FQLModel
-
-
-
-
model.flow.ft_baselines.fql.OneStepActor
9
-
-
1
512
4
-
60
-
-
-
Failed
-
tonghezhang01
1d 17h 26m 25s
-
agent.finetune.flow_baselines.train_fql_agent.TrainFQLAgent
4
9
-
256
1
/home/yuchao/ReinFlow/data/gym/kitchen-mixed-v0
4
cuda:2
cuda:2
4
280
1
kitchen-mixed-v0
false
false
/home/yuchao/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
-
4
/home/yuchao/ReinFlow/log/gym/finetune/kitchen-mixed-v0_fql_mlp_ta4_td4_seed42/2025-05-10_21-40-08_42
-
-
model.flow.ft_baselines.fql.FQLModel
-
-
-
-
model.flow.ft_baselines.fql.OneStepActor
9
-
-
1
512
4
-
60
-
-
-
Finished
-
tonghezhang01
15h 38m 47s
-
agent.finetune.flow_baselines.train_fql_agent.TrainFQLAgent
4
9
-
256
1
/home/yuchao/ReinFlow/data/gym/kitchen-mixed-v0
4
cuda:3
cuda:3
4
280
1
kitchen-mixed-v0
false
false
/home/yuchao/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
-
4
/home/yuchao/ReinFlow/log/gym/finetune/kitchen-mixed-v0_fql_mlp_ta4_td4_seed0/2025-05-10_21-40-08_0
-
-
model.flow.ft_baselines.fql.FQLModel
-
-
-
-
model.flow.ft_baselines.fql.OneStepActor
9
-
-
1
512
4
-
60
-
-
-
Failed
-
tonghezhang01
1d 17h 26m 26s
-
agent.finetune.flow_baselines.train_fql_agent.TrainFQLAgent
4
9
-
256
1
/home/yuchao/ReinFlow/data/gym/kitchen-mixed-v0
4
cuda:2
cuda:2
4
280
1
kitchen-mixed-v0
false
false
/home/yuchao/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
-
4
/home/yuchao/ReinFlow/log/gym/finetune/kitchen-mixed-v0_fql_mlp_ta4_td4_seed2025/2025-05-10_21-40-08_2025
-
-
model.flow.ft_baselines.fql.FQLModel
-
-
-
-
model.flow.ft_baselines.fql.OneStepActor
9
-
-
1
512
4
-
60
-
-
-
Finished
-
tonghezhang01
22h 39m 29s
-
agent.finetune.dppo.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
9
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_diffusion_mlp_ta4_td20/2024-10-20_16-48-28_42/checkpoint/state_8000.pt
-
1
-
20
cuda:3
cuda:3
4
280
40
kitchen-mixed-v0
false
false
/home/zhangtonghe/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
10
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/kitchen-mixed-v0_ppo_diffusion_mlp_ta4_td20_tdf10_seed509/2025-05-09_18-33-34_509
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
9
model.diffusion.mlp_diffusion.DiffusionMLP
9
60
[128,32]
-
-
4
[256,256,256]
-
true
16
-
Finished
-
tonghezhang01
22h 39m 12s
-
agent.finetune.dppo.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
9
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_diffusion_mlp_ta4_td20/2024-10-20_16-48-28_42/checkpoint/state_8000.pt
-
1
-
20
cuda:2
cuda:2
4
280
40
kitchen-mixed-v0
false
false
/home/zhangtonghe/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
10
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/kitchen-mixed-v0_ppo_diffusion_mlp_ta4_td20_tdf10_seed2025/2025-05-09_18-33-25_2025
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
9
model.diffusion.mlp_diffusion.DiffusionMLP
9
60
[128,32]
-
-
4
[256,256,256]
-
true
16
-
Finished
-
tonghezhang01
3h 20m 42s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
9
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_shortcut_mlp_ta4_td20/2025-05-08_03-11-00_42/checkpoint/state_2400.pt
-
1
-
4
cuda:5
cuda:5
4
280
40
kitchen-mixed-v0
false
false
/home/zhangtonghe/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/kitchen-mixed-v0_ppo_shortcut_mlp_ta4_td4_tdf4/2025-05-09_18-33-05_seed509
0.12
0.05
model.flow.ft_ppo.pposhortcut.PPOShortCut
9
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_shortcut_mlp_ta4_td20/2025-05-08_03-11-00_42/checkpoint/state_2400.pt
Finished
-
tonghezhang01
3h 15m 41s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
9
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_shortcut_mlp_ta4_td20/2025-05-08_03-11-00_42/checkpoint/state_2400.pt
-
1
-
4
cuda:4
cuda:4
4
280
40
kitchen-mixed-v0
false
false
/home/zhangtonghe/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/kitchen-mixed-v0_ppo_shortcut_mlp_ta4_td4_tdf4/2025-05-09_18-32-33_seed2025
0.12
0.05
model.flow.ft_ppo.pposhortcut.PPOShortCut
9
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_shortcut_mlp_ta4_td20/2025-05-08_03-11-00_42/checkpoint/state_2400.pt
Finished
-
tonghezhang01
1d 1h 6m 24s
-
agent.finetune.dppo.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
9
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_diffusion_mlp_ta4_td20/2024-10-20_16-48-28_42/checkpoint/state_8000.pt
-
1
-
20
cuda:4
cuda:4
4
280
40
kitchen-mixed-v0
false
false
/home/zhangtonghe/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
10
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/kitchen-mixed-v0_ppo_diffusion_mlp_ta4_td20_tdf10_seed3407/2025-05-09_15-38-28_3407
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
9
model.diffusion.mlp_diffusion.DiffusionMLP
9
60
[128,32]
-
-
4
[256,256,256]
-
true
16
-
Finished
-
tonghezhang01
1d 1h 7m 6s
-
agent.finetune.dppo.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
9
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_diffusion_mlp_ta4_td20/2024-10-20_16-48-28_42/checkpoint/state_8000.pt
-
1
-
20
cuda:1
cuda:1
4
280
40
kitchen-mixed-v0
false
false
/home/zhangtonghe/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
10
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/kitchen-mixed-v0_ppo_diffusion_mlp_ta4_td20_tdf10_seed0/2025-05-09_15-38-28_0
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
9
model.diffusion.mlp_diffusion.DiffusionMLP
9
60
[128,32]
-
-
4
[256,256,256]
-
true
16
-
Finished
-
tonghezhang01
1h 9m 50s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
9
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_shortcut_mlp_ta4_td20/2025-05-08_03-11-00_42/checkpoint/state_2400.pt
-
1
-
4
cuda:6
cuda:6
4
280
40
kitchen-mixed-v0
false
false
/home/zhangtonghe/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/kitchen-mixed-v0_ppo_shortcut_mlp_ta4_td4_tdf4/2025-05-08_23-03-05_seed42
0.12
0.05
model.flow.ft_ppo.pposhortcut.PPOShortCut
9
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_shortcut_mlp_ta4_td20/2025-05-08_03-11-00_42/checkpoint/state_2400.pt
Finished
-
tonghezhang01
1h 10m 50s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
9
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_shortcut_mlp_ta4_td20/2025-05-08_03-11-00_42/checkpoint/state_2400.pt
-
1
-
4
cuda:7
cuda:7
4
280
40
kitchen-mixed-v0
false
false
/home/zhangtonghe/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/kitchen-mixed-v0_ppo_shortcut_mlp_ta4_td4_tdf4/2025-05-08_23-02-13_seed42
0.12
0.05
model.flow.ft_ppo.pposhortcut.PPOShortCut
9
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_shortcut_mlp_ta4_td20/2025-05-08_03-11-00_42/checkpoint/state_2400.pt
Finished
-
tonghezhang01
20s
-
agent.finetune.dppo.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
9
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_diffusion_mlp_ta4_td20/2024-10-20_16-48-28_42/checkpoint/state_8000.pt
-
1
-
20
cuda:5
cuda:5
4
280
40
kitchen-mixed-v0
false
false
/home/zhangtonghe/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
10
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/kitchen-mixed-v0_ppo_diffusion_mlp_ta4_td20_tdf10/2025-05-08_20-34-31_42
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
9
model.diffusion.mlp_diffusion.DiffusionMLP
9
60
[128,32]
-
-
4
[256,256,256]
-
true
16
-
Finished
-
tonghezhang01
1h 13m 13s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
9
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_shortcut_mlp_ta4_td20/2025-05-08_03-11-00_42/checkpoint/state_2400.pt
-
1
-
4
cuda:7
cuda:7
4
280
40
kitchen-mixed-v0
false
false
/home/zhangtonghe/ReinFlow/data/gym/kitchen-mixed-v0/normalization.npz
280
4
1
true
kitchen-mixed-v0
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/kitchen-mixed-v0_ppo_shortcut_mlp_ta4_td4_tdf4/2025-05-08_20-13-28_seed42
0.12
0.05
model.flow.ft_ppo.pposhortcut.PPOShortCut
9
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/kitchen-mixed-v0_pre_shortcut_mlp_ta4_td20/2025-05-08_03-11-00_42/checkpoint/state_2400.pt
1-17
of 17