Wmfrank's workspace
Runs
17
Name
1 visualized
Job Type: SF
Job Type: SF
1
State
Notes
User
Tags
Created
Runtime
Sweep
actor_critic_share_weights
actor_worker_gpus
adam_beta1
adam_beta2
adam_eps
adaptive_stddev
algo
async_rl
batch_size
batched_sampling
benchmark
cli_args.actor_worker_gpus
cli_args.algo
cli_args.batch_size
cli_args.env
cli_args.env_gpu_observations
cli_args.experiment
cli_args.exploration_loss
cli_args.exploration_loss_coeff
cli_args.gamma
cli_args.max_grad_norm
cli_args.megaverse_num_agents_per_env
cli_args.megaverse_num_envs_per_instance
cli_args.megaverse_num_simulation_threads
cli_args.megaverse_use_vulkan
cli_args.num_envs_per_worker
cli_args.num_epochs
cli_args.num_policies
cli_args.num_workers
cli_args.policy_workers_per_policy
cli_args.ppo_epochs
cli_args.recurrence
cli_args.reward_clip
cli_args.rnn_num_layers
cli_args.rollout
cli_args.train_for_env_steps
cli_args.train_for_seconds
cli_args.use_rnn
cli_args.wandb_group
cli_args.wandb_project
cli_args.wandb_tags
cli_args.with_pbt
cli_args.with_wandb
command_line
Finished
-
wmfrank
1d 1h 43m 50s
-
true
0
0.9
0.999
0.000001
true
APPO
true
4096
false
false
0
APPO
4096
TowerBuilding
false
TowerBuilding_real_sf2
symmetric_kl
0.001
0.997
0
1
32
1
true
2
1
1
12
2
-
32
30
2
32
2000000000
360000000
true
megaverse
megaverse-benchmark
real_sf2_test0
false
true
--train_for_seconds=360000000 --train_for_env_steps=2000000000 --algo=APPO --gamma=0.997 --use_rnn=True --rnn_num_layers=2 --num_workers=12 --num_envs_per_worker=2 --num_epochs=1 --rollout=32 --recurrence=32 --batch_size=4096 --actor_worker_gpus 0 --env_gpu_observations=False --num_policies=1 --with_pbt=False --max_grad_norm=0.0 --exploration_loss=symmetric_kl --exploration_loss_coeff=0.001 --megaverse_num_simulation_threads=1 --megaverse_num_envs_per_instance=32 --megaverse_num_agents_per_env=1 --megaverse_use_vulkan=True --policy_workers_per_policy=2 --reward_clip=30 --env=TowerBuilding --experiment=TowerBuilding_real_sf2 --with_wandb=True --wandb_project=megaverse-benchmark --wandb_group=megaverse --wandb_tags real_sf2_test0
Finished
-
wmfrank
1d 1h 43m 50s
-
true
0
0.9
0.999
0.000001
true
APPO
true
4096
false
false
0
APPO
4096
TowerBuilding
false
TowerBuilding_real_sf2
symmetric_kl
0.001
0.997
0
1
32
1
true
2
1
1
12
2
-
32
30
2
32
2000000000
360000000
true
megaverse
megaverse-benchmark
real_sf2_test0
false
true
--train_for_seconds=360000000 --train_for_env_steps=2000000000 --algo=APPO --gamma=0.997 --use_rnn=True --rnn_num_layers=2 --num_workers=12 --num_envs_per_worker=2 --num_epochs=1 --rollout=32 --recurrence=32 --batch_size=4096 --actor_worker_gpus 0 --env_gpu_observations=False --num_policies=1 --with_pbt=False --max_grad_norm=0.0 --exploration_loss=symmetric_kl --exploration_loss_coeff=0.001 --megaverse_num_simulation_threads=1 --megaverse_num_envs_per_instance=32 --megaverse_num_agents_per_env=1 --megaverse_use_vulkan=True --policy_workers_per_policy=2 --reward_clip=30 --env=TowerBuilding --experiment=TowerBuilding_real_sf2 --with_wandb=True --wandb_project=megaverse-benchmark --wandb_group=megaverse --wandb_tags real_sf2_test0
Finished
-
wmfrank
real_sf2_test1
1d 1h 43m 50s
-
true
[0]
0.9
0.999
0.000001
true
APPO
true
4096
false
false
[0]
APPO
4096
TowerBuilding
false
TowerBuilding_real_sf2
symmetric_kl
0.001
0.997
0
1
32
1
true
2
1
1
12
2
-
32
30
2
32
2000000000
360000000
true
megaverse
megaverse-benchmark
["real_sf2_test0"]
false
true
--train_for_seconds=360000000 --train_for_env_steps=2000000000 --algo=APPO --gamma=0.997 --use_rnn=True --rnn_num_layers=2 --num_workers=12 --num_envs_per_worker=2 --num_epochs=1 --rollout=32 --recurrence=32 --batch_size=4096 --actor_worker_gpus 0 --env_gpu_observations=False --num_policies=1 --with_pbt=False --max_grad_norm=0.0 --exploration_loss=symmetric_kl --exploration_loss_coeff=0.001 --megaverse_num_simulation_threads=1 --megaverse_num_envs_per_instance=32 --megaverse_num_agents_per_env=1 --megaverse_use_vulkan=True --policy_workers_per_policy=2 --reward_clip=30 --env=TowerBuilding --experiment=TowerBuilding_real_sf2 --with_wandb=True --wandb_project=megaverse-benchmark --wandb_group=megaverse --wandb_tags real_sf2_test0
1-1
of 1