Tonghezhang01's workspace
Runs
30
Name
30 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
_target_
act_steps
action_dim
base_policy_path
batch_size
cond_steps
dataset_dir
denoising_steps
device
egl_device
env.best_reward_threshold_for_success
env.max_episode_steps
env.n_envs
env.name
env.reset_at_iteration
env.save_video
env.wrappers.mujoco_locomotion_lowdim.normalization_path
env.wrappers.multi_step.max_episode_steps
env.wrappers.multi_step.n_action_steps
env.wrappers.multi_step.n_obs_steps
env.wrappers.multi_step.reset_within_step
env_name
ft_denoising_steps
horizon_steps
logdir
max_std
min_std
model._target_
model.act_dim
model.act_max
model.act_min
model.action_dim
model.actor._target_
model.actor.action_dim
model.actor.activation_type
model.actor.cond_dim
model.actor.cond_steps
model.actor.hidden_dim
model.actor.horizon_steps
model.actor.mlp_dims
model.actor.obs_dim
model.actor.residual_style
model.actor.time_dim
model.actor_policy_path
Finished
-
tonghezhang01
10h 19m 58s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
log_gym_d4rl/Humanoid-medium-v3/Shortcut/state_60.pt
-
1
-
4
cuda:1
cuda:1
3
1000
40
Humanoid-medium-v3
false
false
gym_d4rl_normalization/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/home/yuchao/ReinFlow/log/gym/finetune/Humanoid-medium-v3_ppo_shortcut_mlp_ta4_td4_tdf4/2025-05-22_13-53-36_seed3407
0.16
0.08
model.flow.ft_ppo.pposhortcut.PPOShortCut
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
log_gym_d4rl/Humanoid-medium-v3/Shortcut/state_60.pt
Finished
-
tonghezhang01
9h 1m 52s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
log_gym_d4rl/Humanoid-medium-v3/Shortcut/state_60.pt
-
1
-
4
cuda:6
cuda:6
3
1000
40
Humanoid-medium-v3
false
false
gym_d4rl_normalization/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/home/yuchao/ReinFlow/log/gym/finetune/Humanoid-medium-v3_ppo_shortcut_mlp_ta4_td4_tdf4/2025-05-22_13-53-37_seed42
0.16
0.08
model.flow.ft_ppo.pposhortcut.PPOShortCut
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
log_gym_d4rl/Humanoid-medium-v3/Shortcut/state_60.pt
Finished
-
tonghezhang01
9h 32s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
log_gym_d4rl/Humanoid-medium-v3/Shortcut/state_60.pt
-
1
-
4
cuda:5
cuda:5
3
1000
40
Humanoid-medium-v3
false
false
gym_d4rl_normalization/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/home/yuchao/ReinFlow/log/gym/finetune/Humanoid-medium-v3_ppo_shortcut_mlp_ta4_td4_tdf4/2025-05-22_13-53-36_seed0
0.16
0.08
model.flow.ft_ppo.pposhortcut.PPOShortCut
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
log_gym_d4rl/Humanoid-medium-v3/Shortcut/state_60.pt
Finished
-
tonghezhang01
42m 10s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
/nvme_data/tonghe/dppo-main/log_gym_d4rl/Humanoid-medium-v3/1-ReFlow/state_100.pt
-
1
-
4
cuda:7
cuda:7
3
1000
40
Humanoid-medium-v3
false
false
/nvme_data/tonghe/dppo-main/gym-d4rl-normalization/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/nvme_data/tonghe/dppo-main/log/gym/finetune/Humanoid-medium-v3_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-22_05-20-23_seed42
0.16
0.08
model.flow.ft_ppo.ppoflow.PPOFlow
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/nvme_data/tonghe/dppo-main/log_gym_d4rl/Humanoid-medium-v3/1-ReFlow/state_100.pt
Finished
-
tonghezhang01
44m 39s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
/nvme_data/tonghe/dppo-main/log_gym_d4rl/Humanoid-medium-v3/1-ReFlow/state_100.pt
-
1
-
4
cuda:1
cuda:1
3
1000
40
Humanoid-medium-v3
false
false
/nvme_data/tonghe/dppo-main/gym-d4rl-normalization/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/nvme_data/tonghe/dppo-main/log/gym/finetune/Humanoid-medium-v3_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-22_05-20-23_seed0
0.16
0.08
model.flow.ft_ppo.ppoflow.PPOFlow
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/nvme_data/tonghe/dppo-main/log_gym_d4rl/Humanoid-medium-v3/1-ReFlow/state_100.pt
Finished
-
tonghezhang01
1h 25m 40s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
/nvme_data/tonghe/dppo-main/log_gym_d4rl/Humanoid-medium-v3/1-ReFlow/state_100.pt
-
1
-
4
cuda:0
cuda:0
3
1000
40
Humanoid-medium-v3
false
false
/nvme_data/tonghe/dppo-main/gym-d4rl-normalization/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/nvme_data/tonghe/dppo-main/log/gym/finetune/Humanoid-medium-v3_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-22_05-20-23_seed3407
0.16
0.08
model.flow.ft_ppo.ppoflow.PPOFlow
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/nvme_data/tonghe/dppo-main/log_gym_d4rl/Humanoid-medium-v3/1-ReFlow/state_100.pt
Finished
-
tonghezhang01
17h 21m 59s
-
agent.finetune.reinflow.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
17
/nvme_data/tonghe/dppo-main/log_gym_d4rl/Humanoid-medium-v3/DDPM/state_120.pt
-
1
-
20
cuda:2
cuda:2
3
1000
40
Humanoid-medium-v3
false
false
/nvme_data/tonghe/dppo-main/gym-d4rl-normalization/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
10
4
/nvme_data/tonghe/dppo-main/log/gym/finetune/Humanoid-medium-v3_ppo_diffusion_mlp_ta4_td4_d4rl_seed3407/2025-05-22_05-16-38_3407
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
17
model.diffusion.mlp_diffusion.DiffusionMLP
17
ReLU
376
-
-
4
[512,512,512]
-
true
16
-
Finished
-
tonghezhang01
17h 18m 16s
-
agent.finetune.reinflow.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
17
/nvme_data/tonghe/dppo-main/log_gym_d4rl/Humanoid-medium-v3/DDPM/state_120.pt
-
1
-
20
cuda:3
cuda:3
3
1000
40
Humanoid-medium-v3
false
false
/nvme_data/tonghe/dppo-main/gym-d4rl-normalization/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
10
4
/nvme_data/tonghe/dppo-main/log/gym/finetune/Humanoid-medium-v3_ppo_diffusion_mlp_ta4_td4_d4rl_seed0/2025-05-22_05-16-26_0
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
17
model.diffusion.mlp_diffusion.DiffusionMLP
17
ReLU
376
-
-
4
[512,512,512]
-
true
16
-
Finished
-
tonghezhang01
17h 18m 40s
-
agent.finetune.reinflow.train_ppo_diffusion_agent.TrainPPODiffusionAgent
4
17
/nvme_data/tonghe/dppo-main/log_gym_d4rl/Humanoid-medium-v3/DDPM/state_120.pt
-
1
-
20
cuda:4
cuda:4
3
1000
40
Humanoid-medium-v3
false
false
/nvme_data/tonghe/dppo-main/gym-d4rl-normalization/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
10
4
/nvme_data/tonghe/dppo-main/log/gym/finetune/Humanoid-medium-v3_ppo_diffusion_mlp_ta4_td4_d4rl_seed42/2025-05-22_05-16-09_42
-
-
model.diffusion.diffusion_ppo.PPODiffusion
-
-
-
17
model.diffusion.mlp_diffusion.DiffusionMLP
17
ReLU
376
-
-
4
[512,512,512]
-
true
16
-
Finished
-
tonghezhang01
3h 54m 20s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
-
1
-
4
cuda:5
cuda:5
3
1000
40
Humanoid-medium-v3
false
false
/home/zhangtonghe/ReinFlow/data/gym/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/Humanoid-medium-v3_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-13_11-29-11_seed42
0.16
0.08
model.flow.ft_ppo.ppoflow.PPOFlow
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
Finished
-
tonghezhang01
3h 54m 18s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
-
1
-
4
cuda:4
cuda:4
3
1000
40
Humanoid-medium-v3
false
false
/home/zhangtonghe/ReinFlow/data/gym/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/Humanoid-medium-v3_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-13_11-29-11_seed0
0.16
0.08
model.flow.ft_ppo.ppoflow.PPOFlow
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
Finished
-
tonghezhang01
3h 54m 18s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
-
1
-
4
cuda:6
cuda:6
3
1000
40
Humanoid-medium-v3
false
false
/home/zhangtonghe/ReinFlow/data/gym/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/Humanoid-medium-v3_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-13_11-29-11_seed3407
0.16
0.08
model.flow.ft_ppo.ppoflow.PPOFlow
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
Finished
-
tonghezhang01
7h 48m 19s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
-
1
-
4
cuda:6
cuda:6
3
1000
40
Humanoid-medium-v3
false
false
/home/zhangtonghe/ReinFlow/data/gym/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/Humanoid-medium-v3_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-13_00-40-29_seed3407
0.16
0.08
model.flow.ft_ppo.ppoflow.PPOFlow
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
Finished
-
tonghezhang01
7h 48m 20s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
-
1
-
4
cuda:5
cuda:5
3
1000
40
Humanoid-medium-v3
false
false
/home/zhangtonghe/ReinFlow/data/gym/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/Humanoid-medium-v3_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-13_00-40-29_seed42
0.16
0.08
model.flow.ft_ppo.ppoflow.PPOFlow
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
Finished
-
tonghezhang01
7h 48m 23s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
-
1
-
4
cuda:4
cuda:4
3
1000
40
Humanoid-medium-v3
false
false
/home/zhangtonghe/ReinFlow/data/gym/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/Humanoid-medium-v3_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-13_00-40-30_seed0
0.16
0.08
model.flow.ft_ppo.ppoflow.PPOFlow
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
Finished
-
tonghezhang01
7h 48m 23s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
-
1
-
4
cuda:7
cuda:7
3
1000
40
Humanoid-medium-v3
false
false
/home/zhangtonghe/ReinFlow/data/gym/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/Humanoid-medium-v3_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-13_00-32-46_seed42
0.16
0.08
model.flow.ft_ppo.ppoflow.PPOFlow
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
Finished
-
tonghezhang01
7h 48m 23s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
-
1
-
4
cuda:7
cuda:7
3
1000
40
Humanoid-medium-v3
false
false
/home/zhangtonghe/ReinFlow/data/gym/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/Humanoid-medium-v3_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-13_00-32-45_seed0
0.16
0.08
model.flow.ft_ppo.ppoflow.PPOFlow
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
Finished
-
tonghezhang01
7h 48m 23s
-
agent.finetune.reinflow.train_ppo_flow_agent.TrainPPOFlowAgent
4
17
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
-
1
-
4
cuda:7
cuda:7
3
1000
40
Humanoid-medium-v3
false
false
/home/zhangtonghe/ReinFlow/data/gym/Humanoid-medium-v3/normalization.npz
1000
4
1
true
Humanoid-medium-v3
4
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/Humanoid-medium-v3_ppo_reflow_mlp_ta4_td4_tdf4/2025-05-13_00-32-46_seed3407
0.16
0.08
model.flow.ft_ppo.ppoflow.PPOFlow
17
1
-1
-
-
-
-
-
-
-
-
-
-
-
-
/home/zhangtonghe/ReinFlow/log/gym/pretrain/Humanoid-v3_pre_reflow_mlp_ta4_td20/2025-05-01_18-18-08_42/checkpoint/state_50.pt
Finished
-
tonghezhang01
1d 14h 48m 46s
-
agent.finetune.flow_baselines.train_fql_agent.TrainFQLAgent
4
17
-
256
1
/home/zhangtonghe/ReinFlow/data-offline/gym/Humanoid-medium-v3-offline/
4
cuda:1
cuda:1
3
1000
1
Humanoid-medium-v3
false
false
/home/zhangtonghe/ReinFlow/data-offline/gym/Humanoid-medium-v3-offline//normalization.npz
1000
4
1
true
Humanoid-medium-v3
-
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/Humanoid-medium-v3_fql_mlp_ta4_seed0/2025-05-10_20-54-05_0
-
-
model.flow.ft_baselines.fql.FQLModel
-
-
-
-
model.flow.ft_baselines.fql.OneStepActor
17
-
-
1
512
4
-
376
-
-
-
Finished
-
tonghezhang01
1d 18h 16m 55s
-
agent.finetune.flow_baselines.train_fql_agent.TrainFQLAgent
4
17
-
256
1
/home/zhangtonghe/ReinFlow/data-offline/gym/Humanoid-medium-v3-offline/
4
cuda:2
cuda:2
3
1000
1
Humanoid-medium-v3
false
false
/home/zhangtonghe/ReinFlow/data-offline/gym/Humanoid-medium-v3-offline//normalization.npz
1000
4
1
true
Humanoid-medium-v3
-
4
/home/zhangtonghe/ReinFlow/log/gym/finetune/Humanoid-medium-v3_fql_mlp_ta4_seed3407/2025-05-10_20-54-05_3407
-
-
model.flow.ft_baselines.fql.FQLModel
-
-
-
-
model.flow.ft_baselines.fql.OneStepActor
17
-
-
1
512
4
-
376
-
-
-
1-20
of 30