Tgdivy's workspace
Runs
153
Name
23 visualized
env
model
full_communication_3
ppo_shared_global_critic_rec
full_communication_3
ppo_shared_global_critic_rec
full_communication_3
ppo_shared_global_critic_rec
full_communication_3
ppo_shared_global_critic_rec
full_communication_3
ppo_shared_global_critic_rec
full_communication_3
ppo_shared_global_critic_rec
full_communication_2
ppo_shared_global_critic_rec
full_communication_3
ppo_shared_global_critic_rec
full_communication_2
ppo_shared_global_critic_rec
full_communication_3
ppo_shared_global_critic_rec
full_communication_4
ppo_shared_global_critic_rec
full_communication_4
ppo_shared_global_critic_rec
full_communication_4
ppo_shared_global_critic_rec
full_communication_3
ppo_shared_global_critic_rec
full_communication_4
ppo_shared_global_critic_rec
full_communication_4
ppo_shared_global_critic_rec
full_communication_4
ppo_shared_global_critic_rec
full_communication_4
ppo_shared_global_critic_rec
full_communication_3
ppo_shared_future
full_communication_2
ppo_shared_global_critic_rec
Notes
Runtime
State
Tags
num_envs
total_timesteps
wandb
load_weights_name
video
bs
gru_hidden_size
gru_layers
hidden_size
learn_n
n_agents
total_episodes
comm/symbols_per_ep
comm/vocab_size
dev/End_reward
dev/Episode_return
losses/approx_kl
losses/clipfrac
losses/entropy
losses/explained_variance
losses/policy_loss
losses/value_loss
dev/agent_2
losses/approx_kl_agent_0
losses/approx_kl_agent_1
losses/clipfrac_agent_0
losses/clipfrac_agent_1
losses/entropy_agent_0
losses/entropy_agent_1
losses/explained_variance_agent_0
losses/explained_variance_agent_1
losses/policy_loss_agent_0
losses/policy_loss_agent_1
losses/value_loss_agent_0
losses/value_loss_agent_1
losses/approx_kl_agent_2
losses/clipfrac_agent_2
losses/entropy_agent_2
losses/explained_variance_agent_2
losses/policy_loss_agent_2
losses/value_loss_agent_2
comm/symbols_per_ep_agent_3
29m 48s
Finished
512
12500
true
/ppo_shared_global_critic_rec-full_communication_3-no_save_norm_comm5
true
-
-
-
-
-
-
-
8.27333
2
-0.10818
-8.72716
0.02037
0.071651
1.25056
0.85023
-0.0023277
0.89175
-0.12303
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2h 51m 20s
Crashed
512
100000
true
-
false
-
-
-
-
-
-
-
9.60667
2
-0.11108
-8.96518
0.011119
0
1.24226
0.91506
7.9473e-10
0.034131
-0.11635
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
20s
Failed
512
1000
true
/ppo_shared_global_critic_rec-full_communication_3-no_save_norm_comm5
false
-
-
-
-
-
-
-
6.90667
2
-0.11366
-9.25373
-
-
-
-
-
-
-0.10639
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
3h 32m 5s
Finished
1024
50000
true
-
false
-
-
-
-
-
-
-
10.26667
2
-0.118
-9.42537
0.0054827
0.043324
0.99883
0.94837
-0.0027161
0.21359
-0.11234
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
5m 26s
Finished
512
6250
true
/ppo_shared_global_critic_rec-full_communication_3-no_save_norm_comm5
false
-
-
-
-
-
-
-
8.2
2
-0.12172
-8.5248
0.010221
0.049599
1.21999
0.92229
-0.0007525
0.15214
-0.11908
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
16m 17s
Finished
512
6250
true
/ppo_shared_global_critic_rec-full_communication_3-no_save_norm_comm5
true
-
-
-
-
-
-
-
9.14667
2
-0.12759
-9.03908
0.010094
0.053919
1.24998
0.93436
-0.0013769
0.13868
-0.1284
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2h 15m 45s
Crashed
512
100000
true
-
false
-
-
-
-
-
-
-
10.4
2
-0.13744
-10.61404
0.044984
0
0.56647
0.96962
-3.5763e-10
0.018655
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
6m 44s
Finished
512
12500
true
/ppo_shared_global_critic_rec-full_communication_3-no_save_norm_comm5
true
-
-
-
-
-
-
-
14
2
-0.252
-10.86444
0.041281
0
1.20363
0.838
-2.0663e-9
0.1462
-0.25385
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
13m 7s
Killed
256
25000
true
-
true
-
-
-
-
-
-
-
7.17
2
-0.25469
-10.58973
0.0083064
0.083984
1.02243
0.95156
-0.0040032
0.2037
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
17m 56s
Finished
512
12500
true
/ppo_shared_global_critic_rec-full_communication_3-no_save_norm_comm5
true
-
-
-
-
-
-
-
4.84
2
-0.28631
-11.73218
0.032835
0
1.10077
0.79095
1.4305e-9
0.14073
-0.27977
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
5h 17m 31s
Finished
512
100000
true
-
false
-
-
-
-
-
-
-
10.08
2
-0.39986
-14.28569
0.0090801
0.051264
1.17496
0.94783
-0.0067947
0.45741
-0.41218
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
10.52
3h 22m 21s
Crashed
512
150000
true
-
false
-
-
-
-
-
-
-
9.365
2
-0.43446
-13.58763
0.005856
0.041811
1.12507
0.96318
-0.0042514
0.38813
-0.39911
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
8.22
2h 54m 59s
Failed
1024
100000
true
-
true
-
-
-
-
-
-
-
10.535
2
-0.44688
-14.93175
0.0083996
0.05914
1.31143
0.9501
-0.0073542
0.48153
-0.43244
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
11.2
2h 11m 13s
Failed
1024
50000
true
-
true
-
-
-
-
-
-
-
6.14667
2
-0.5805
-16.29617
0.0040491
0.033311
1.22217
0.97316
-0.0021549
0.3063
-0.58016
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
7h 55m 40s
Finished
512
150000
true
-
false
-
-
-
-
-
-
-
11.865
2
-0.58929
-17.74291
0.0059136
0.034547
1.24361
0.94391
-0.0055707
0.75406
-0.56805
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
13.2
2h 28m 43s
Failed
512
100000
true
-
true
-
-
-
-
-
-
-
8.43
2
-0.64304
-18.33676
0.0096061
0.062277
1.46509
0.97594
-0.0094054
0.38371
-0.6602
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
8.7
18h 36m 57s
Finished
256
200000
true
-
true
-
-
-
-
-
-
-
10.23
2
-0.64681
-17.88856
0.11234
0.12578
0.92058
0.97228
-0.018879
0.33581
-0.62234
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
10.62
36m 45s
Crashed
1024
100000
true
-
false
-
-
-
-
-
-
-
8.605
2
-0.66743
-17.94123
0.0039348
0.017811
1.65686
0.97974
-0.0017513
0.29033
-0.6365
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
8.82
40m 19s
Finished
512
75000
true
-
true
-
-
-
-
-
-
-
4.76667
2
-0.66779
-18.35022
0.0040377
0.022872
1.50724
0.97971
-0.0012753
0.27718
-0.68131
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
16m 58s
Finished
256
25000
true
-
true
-
-
-
-
-
-
-
7.58
2
-0.68976
-18.06385
0.0086742
0.06375
1.46836
0.97793
-0.0071137
0.31381
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
1-20
of 23