Tonghezhang01's workspace
Runs
32
Name
32 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
_target_
act_steps
action_dim
base_policy_path
batch_size
cond_steps
dataset_dir
denoising_steps
device
egl_device
env.best_reward_threshold_for_success
env.max_episode_steps
env.n_envs
env.name
env.reset_at_iteration
env.save_video
env.wrappers.mujoco_locomotion_lowdim.normalization_path
env.wrappers.multi_step.max_episode_steps
env.wrappers.multi_step.n_action_steps
env.wrappers.multi_step.n_obs_steps
env.wrappers.multi_step.reset_within_step
env_name
ft_denoising_steps
horizon_steps
logdir
max_std
min_std
model._target_
model.act_dim
model.act_max
model.act_min
model.action_dim
model.actor._target_
model.actor.action_dim
model.actor.activation_type
model.actor.cond_dim
model.actor.cond_steps
model.actor.hidden_dim
model.actor.horizon_steps
model.actor.mlp_dims
model.actor.obs_dim
model.actor.residual_style
model.actor.time_dim
model.actor_policy_path
Finished
-
tonghezhang01
2h 28m 43s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
6
log_gym_d4rl/walker2d-medium-v2/Shortcut/state_40.pt
-
1
-
4
cuda:3
cuda:3
3
1000
40
walker2d-medium-v2
false
false
gym_d4rl_normalization/walker-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
4
4
/home/yuchao/ReinFlow/log/gym/finetune/walker2d-medium-v2_ppo_shortcut_mlp_ta4_td4_tdf4/2025-05-22_13-43-34_seed0
0.24
0.1
model.flow.ft_ppo.pposhortcut.PPOShortCut
6
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
log_gym_d4rl/walker2d-medium-v2/Shortcut/state_40.pt
Finished
-
tonghezhang01
13h 6m 46s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
6
log_gym_d4rl/walker2d-medium-v2/Shortcut/state_40.pt
-
1
-
4
cuda:2
cuda:2
3
1000
40
walker2d-medium-v2
false
false
gym_d4rl_normalization/walker-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
4
4
/home/yuchao/ReinFlow/log/gym/finetune/walker2d-medium-v2_ppo_shortcut_mlp_ta4_td4_tdf4/2025-05-22_13-43-34_seed3407
0.24
0.1
model.flow.ft_ppo.pposhortcut.PPOShortCut
6
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
log_gym_d4rl/walker2d-medium-v2/Shortcut/state_40.pt
Finished
-
tonghezhang01
1d 3m 59s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
6
log_gym_d4rl/walker2d-medium-v2/Shortcut/state_40.pt
-
1
-
4
cuda:4
cuda:4
3
1000
40
walker2d-medium-v2
false
false
gym_d4rl_normalization/walker-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
4
4
/home/yuchao/ReinFlow/log/gym/finetune/walker2d-medium-v2_ppo_shortcut_mlp_ta4_td4_tdf4/2025-05-22_13-43-34_seed42
0.24
0.1
model.flow.ft_ppo.pposhortcut.PPOShortCut
6
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
log_gym_d4rl/walker2d-medium-v2/Shortcut/state_40.pt
Finished
-
tonghezhang01
7h 31m 48s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
6
log_gym_d4rl/walker2d-medium-v2/1-ReFlow/state_80.pt
-
1
-
4
cuda:5
cuda:5
3
1000
40
walker2d-medium-v2
false
false
gym_d4rl_normalization/walker-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
4
4
/home/yuchao/ReinFlow/log/gym/finetune/walker2d-medium-v2_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-22_13-34-39_seed3407
0.24
0.1
model.flow.ft_ppo.ppoflow.PPOFlow
6
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
log_gym_d4rl/walker2d-medium-v2/1-ReFlow/state_80.pt
Finished
-
tonghezhang01
7h 14m 55s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
6
log_gym_d4rl/walker2d-medium-v2/1-ReFlow/state_80.pt
-
1
-
4
cuda:6
cuda:6
3
1000
40
walker2d-medium-v2
false
false
gym_d4rl_normalization/walker-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
4
4
/home/yuchao/ReinFlow/log/gym/finetune/walker2d-medium-v2_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-22_13-34-28_seed0
0.24
0.1
model.flow.ft_ppo.ppoflow.PPOFlow
6
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
log_gym_d4rl/walker2d-medium-v2/1-ReFlow/state_80.pt
Finished
-
tonghezhang01
5h 26m 14s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
6
log_gym_d4rl/walker2d-medium-v2/1-ReFlow/state_80.pt
-
1
-
4
cuda:7
cuda:7
3
1000
40
walker2d-medium-v2
false
false
gym_d4rl_normalization/walker-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
4
4
/home/yuchao/ReinFlow/log/gym/finetune/walker2d-medium-v2_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-22_13-33-28_seed42
0.24
0.1
model.flow.ft_ppo.ppoflow.PPOFlow
6
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
log_gym_d4rl/walker2d-medium-v2/1-ReFlow/state_80.pt
Finished
-
tonghezhang01
1d 2h 1m 37s
-
agent.finetune.reinflow.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
6
log_gym_d4rl/walker2d-medium-v2/DDPM/state_60.pt
-
1
-
20
cuda:1
cuda:1
3
1000
40
walker2d-medium-v2
false
false
gym_d4rl_normalization/gym-d4rl-normalization/walker-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
10
4
/home/zhangtonghe/dppo/log/gym/finetune/walker2d-medium-v2_ppo_diffusion_mlp_ta4_td4_d4rl_seed0/2025-05-22_11-41-25_seed0
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
6
model.diffusion.mlp_diffusion.DiffusionMLP
6
ReLU
17
-
-
4
[512,512,512]
-
true
16
-
Finished
-
tonghezhang01
1d 1h 50m 4s
-
agent.finetune.reinflow.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
6
log_gym_d4rl/walker2d-medium-v2/DDPM/state_60.pt
-
1
-
20
cuda:0
cuda:0
3
1000
40
walker2d-medium-v2
false
false
gym_d4rl_normalization/gym-d4rl-normalization/walker-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
10
4
/home/zhangtonghe/dppo/log/gym/finetune/walker2d-medium-v2_ppo_diffusion_mlp_ta4_td4_d4rl_seed3407/2025-05-22_11-41-25_seed3407
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
6
model.diffusion.mlp_diffusion.DiffusionMLP
6
ReLU
17
-
-
4
[512,512,512]
-
true
16
-
Crashed
-
tonghezhang01
1d 5h 51m 26s
-
agent.finetune.reinflow.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
6
log_gym_d4rl/walker2d-medium-v2/DDPM/state_60.pt
-
1
-
20
cuda:7
cuda:7
3
1000
40
walker2d-medium-v2
false
false
gym_d4rl_normalization/gym-d4rl-normalization/walker-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
10
4
/home/zhangtonghe/dppo/log/gym/finetune/walker2d-medium-v2_ppo_diffusion_mlp_ta4_td4_d4rl_seed42/2025-05-22_11-41-25_seed42
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
6
model.diffusion.mlp_diffusion.DiffusionMLP
6
ReLU
17
-
-
4
[512,512,512]
-
true
16
-
Finished
-
tonghezhang01
2d 15h 56m 23s
-
agent.finetune.flow_baselines.train_fql_agent.TrainFQLAgent
4
6
-
256
1
/home/zhangtonghe/ReinFlow/data-offline/gym/walker2d-medium-v2
4
cuda:2
cuda:2
3
1000
1
walker2d-medium-v2
false
false
/home/zhangtonghe/ReinFlow/data-offline/gym/walker2d-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
-
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/walker2d-medium-v2_fql_mlp_ta4_td4_seed3407/2025-05-10_13-16-07_3407
-
-
model.flow.ft_baselines.fql.FQLModel
-
-
-
-
model.flow.ft_baselines.fql.OneStepActor
6
-
-
1
512
4
-
17
-
-
-
Finished
-
tonghezhang01
2d 15h 56m 12s
-
agent.finetune.flow_baselines.train_fql_agent.TrainFQLAgent
4
6
-
256
1
/home/zhangtonghe/ReinFlow/data-offline/gym/walker2d-medium-v2
4
cuda:2
cuda:2
3
1000
1
walker2d-medium-v2
false
false
/home/zhangtonghe/ReinFlow/data-offline/gym/walker2d-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
-
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/walker2d-medium-v2_fql_mlp_ta4_td4_seed0/2025-05-10_13-16-07_0
-
-
model.flow.ft_baselines.fql.FQLModel
-
-
-
-
model.flow.ft_baselines.fql.OneStepActor
6
-
-
1
512
4
-
17
-
-
-
Finished
-
tonghezhang01
9h 11m 29s
-
agent.finetune.flow_baselines.train_fql_agent.TrainFQLAgent
4
6
-
256
1
/home/zhangtonghe/ReinFlow/data-offline/gym/walker2d-medium-v2
4
cuda:2
cuda:2
3
1000
1
walker2d-medium-v2
false
false
/home/zhangtonghe/ReinFlow/data-offline/gym/walker2d-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
-
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/walker2d-medium-v2_fql_mlp_ta4_td4/2025-05-09_11-54-21_42
-
-
model.flow.ft_baselines.fql.FQLModel
-
-
-
-
model.flow.ft_baselines.fql.OneStepActor
6
-
-
1
512
4
-
17
-
-
-
Finished
-
tonghezhang01
49s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
-
tonghezhang01
43s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
-
tonghezhang01
49s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
-
tonghezhang01
1d 40m 1s
-
agent.finetune.mine.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
6
/home/zhangtonghe/ReinFlow/log/gym/pretrain/walker2d-medium-v2_pre_diffusion_mlp_ta4_td20/2024-06-12_23-06-12/checkpoint/state_3000.pt
-
1
-
20
cuda:6
-
3
1000
40
walker2d-medium-v2
false
false
/home/zhangtonghe/ReinFlow/data/gym/walker2d-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/walker2d-medium-v2_ppo_diffusion_DDIM_4steps_seed3407/2025-04-29_20-43-19_seed3407
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
6
model.diffusion.mlp_diffusion.DiffusionMLP
6
ReLU
17
-
-
4
[512,512,512]
-
true
16
-
Finished
-
tonghezhang01
1d 1h 23m 29s
-
agent.finetune.mine.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
6
/home/zhangtonghe/ReinFlow/log/gym/pretrain/walker2d-medium-v2_pre_diffusion_mlp_ta4_td20/2024-06-12_23-06-12/checkpoint/state_3000.pt
-
1
-
20
cuda:7
-
3
1000
40
walker2d-medium-v2
false
false
/home/zhangtonghe/ReinFlow/data/gym/walker2d-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/walker2d-medium-v2_ppo_diffusion_DDIM_4steps_seed0/2025-04-29_20-43-13_seed0
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
6
model.diffusion.mlp_diffusion.DiffusionMLP
6
ReLU
17
-
-
4
[512,512,512]
-
true
16
-
Finished
-
tonghezhang01
7h 45m 26s
-
agent.finetune.mine.train_ppo_flow_agent.TrainPPOFlowAgent
4
6
/home/zhangtonghe/ReinFlow/log/gym/pretrain/walker2d-v2/ReFlow/2025-02-06_01-39-14_42_state_1500.pt
-
1
-
4
cuda:7
-
3
1000
40
walker2d-medium-v2
false
false
/home/zhangtonghe/ReinFlow/data/gym/walker2d-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/walker2d-medium-v2_ppo_reflow_mlp_ta4_td4_tdf4/2025-04-28_22-04-39_seed3407
0.24
0.1
model.flow.ft_ppo.ppoflow.PPOFlow
6
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/walker2d-v2/ReFlow/2025-02-06_01-39-14_42_state_1500.pt
Finished
-
tonghezhang01
7h 52m 21s
-
agent.finetune.mine.train_ppo_flow_agent.TrainPPOFlowAgent
4
6
/home/zhangtonghe/ReinFlow/log/gym/pretrain/walker2d-v2/ReFlow/2025-02-06_01-39-14_42_state_1500.pt
-
1
-
4
cuda:6
-
3
1000
40
walker2d-medium-v2
false
false
/home/zhangtonghe/ReinFlow/data/gym/walker2d-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/walker2d-medium-v2_ppo_reflow_mlp_ta4_td4_tdf4/2025-04-28_22-04-31_seed42
0.24
0.1
model.flow.ft_ppo.ppoflow.PPOFlow
6
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/walker2d-v2/ReFlow/2025-02-06_01-39-14_42_state_1500.pt
Finished
-
tonghezhang01
7h 59m 36s
-
agent.finetune.mine.train_ppo_flow_agent.TrainPPOFlowAgent
4
6
/home/zhangtonghe/ReinFlow/log/gym/pretrain/walker2d-v2/ReFlow/2025-02-06_01-39-14_42_state_1500.pt
-
1
-
4
cuda:5
-
3
1000
40
walker2d-medium-v2
false
false
/home/zhangtonghe/ReinFlow/data/gym/walker2d-medium-v2/normalization.npz
1000
4
1
true
walker2d-medium-v2
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/walker2d-medium-v2_ppo_reflow_mlp_ta4_td4_tdf4/2025-04-28_22-04-18_seed0
0.24
0.1
model.flow.ft_ppo.ppoflow.PPOFlow
6
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/walker2d-v2/ReFlow/2025-02-06_01-39-14_42_state_1500.pt
1-20
of 32