Last active
October 13, 2022 08:19
-
-
Save cool-RR/0b7044daeaeacd3ed6c859e3dc0c1afb to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
algorithm.iteration=248 | |
results['episode_reward_mean']=185522.60799999998 | |
blue_agent_0_proximity_to_red_agent_0_mean=0.348 | |
blue_agent_0_proximity_to_red_agent_1_mean=0.333 | |
blue_agent_0_proximity_to_red_agent_2_mean=0.130 | |
blue_agent_0_proximity_to_red_agent_3_mean=0.197 | |
blue_agent_1_proximity_to_red_agent_0_mean=0.141 | |
blue_agent_1_proximity_to_red_agent_1_mean=0.278 | |
blue_agent_1_proximity_to_red_agent_2_mean=0.173 | |
blue_agent_1_proximity_to_red_agent_3_mean=0.416 | |
Sample game: | |
[ 3 0 a b 1 2 ] | |
[ 3 0 a b 1 2 ] | |
[ 3 0 a b 1 2 ] | |
[3 0 a b 1 2 ] | |
[ 0 a b 1 2 3] | |
[0 a b 1 2 3 ] | |
[ a b 1 2 3 0] | |
[ a b 1 2 3 0 ] | |
[ a b 1 2 3 0 ] | |
[ a b 1 2 3 0 ] | |
[ a b 1 2 3 0 ] | |
[ a b 1 2 3 0 ] | |
[ a b 1 2 3 0 ] | |
[ a b 1 2 3 0 ] | |
[ a b 1 2 3 0 ] | |
[ a b 1 2 3 0 ] | |
[ a b 12 3 0 ] | |
[ a b 12 3 0 ] | |
[ a b 213 0 ] | |
[ a b *10 ] | |
[ a b * 01 ] | |
[ a b 3 *1 ] | |
[ a b * 1 ] | |
[ a b * 21 ] | |
[ a b * 21 ] | |
[ a b *12 ] | |
[ a b * 21 ] | |
[ a b *12 ] | |
[ a b * 12 ] | |
[ a b 3 012 ] | |
[ a b * 21 ] | |
[ a b 3 012 ] | |
[ a b * 21 ] | |
[ a b * 21 ] | |
[ a b *12 ] | |
[ a b * 21 ] | |
[ a b 3 012 ] | |
[ a b 3 *1 ] | |
[ a b 3 0 21 ] | |
[ a b * 21 ] | |
[ a b 3 *1 ] | |
[a b 3 0 21 ] | |
[a b 3 * 1 ] | |
[a b 3 * 1 ] | |
[ b 3 0 2 1 a] | |
[ b 3 * 1 a] | |
[ b 3 * 1 a] | |
[ b 3 *1 a ] | |
[ b 3 2 01 a] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a] | |
[ b 3 2 01 a] | |
[ b 3 2 10 a] | |
[ b 3 2 01 a] | |
[ b 3 2 01 a] | |
[ b 3 2 01 a] | |
[ b 3 2 01 a] | |
[ b 3 2 01 a] | |
[ b 3 210 a] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b * 21 a ] | |
[ b 3 *1 a ] | |
[ b 3 0 21 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 21 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 21 a ] | |
[ b 3 *1 a ] | |
[ b 3 0 21 a ] | |
[ b 3 0 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 2 1 a ] | |
[ b * 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 21 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 *1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 21 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 2 1 a ] | |
[ b 3 0 21 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 *1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 21 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 21 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 21 a ] | |
[ b 3 0 2 1 a ] | |
[ b 3 0 21 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 0 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b * 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 *1 a ] | |
[ b 3 0 21 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b * 1 a ] | |
[ b 2 * 1 a ] | |
[ b * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 01 a ] | |
[ b 3 210 a ] | |
[ b 3 *1 a ] | |
[ b 3 *1 a ] | |
[ b 3 210 a ] | |
[ b 3 210 a ] | |
[ b 3 2 01 a ] | |
[ b 3 210 a ] | |
[ b 3 210 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 01 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 10 a ] | |
[ b 3 2 10 a ] | |
[ b 3 210 a ] | |
[ b 3 210 a ] | |
[ b 3 2 01 a ] | |
[ b 3 210 a ] | |
[ b 3 210 a ] | |
[ b 3 *1 a ] | |
algorithm.iteration=249 | |
results['episode_reward_mean']=185430.82799999998 | |
blue_agent_0_proximity_to_red_agent_0_mean=0.350 | |
blue_agent_0_proximity_to_red_agent_1_mean=0.334 | |
blue_agent_0_proximity_to_red_agent_2_mean=0.127 | |
blue_agent_0_proximity_to_red_agent_3_mean=0.196 | |
blue_agent_1_proximity_to_red_agent_0_mean=0.138 | |
blue_agent_1_proximity_to_red_agent_1_mean=0.276 | |
blue_agent_1_proximity_to_red_agent_2_mean=0.170 | |
blue_agent_1_proximity_to_red_agent_3_mean=0.424 | |
Sample game: | |
[ 3 b a 1 0 2 ] | |
[ 3b a 1 0 2 ] | |
[ 3 b a 1 0 2 ] | |
[ 3 b a 1 0 2 ] | |
[ 3 b a 1 0 2 ] | |
[ 3 b a 1 0 2 ] | |
[ 3 b a 1 0 2 ] | |
[ 3 b a 1 0 2 ] | |
[ 3 b a 1 0 2 ] | |
[ 3 b a 1 0 2 ] | |
[ 3 b a 1 0 2 ] | |
[3 b a 1 0 2 ] | |
[ b a 1 0 2 3] | |
[ b a 1 0 2 3 ] | |
[ b a 1 0 2 3 ] | |
[ b a 1 0 2 3 ] | |
[ b a 1 0 2 3 ] | |
[ b a * 2 3 ] | |
[ b a * 2 3 ] | |
[ b a * 2 3 ] | |
[ b a 0 * 3 ] | |
[ b a 0 * 3 ] | |
[ b a 0 *3 ] | |
[ b a 0 132 ] | |
[ b a 0 31 2 ] | |
[ b a 031 2 ] | |
[ b a 30 1 2 ] | |
[ b a 30 1 2 ] | |
[ b a 03 * ] | |
[ b a 30 1 2 ] | |
[ b a 03 * ] | |
[ b a 30 1 2 ] | |
[ b a 031 2 ] | |
[ b a 30 1 2 ] | |
[ b a 03 * ] | |
[ b a 30 1 2 ] | |
[ b a 031 2 ] | |
[ b a 30 1 2 ] | |
[ b a 3* 2 ] | |
[ b a 30 * ] | |
[ b a 031 2 ] | |
[ b a 30 * ] | |
[ b a 031 2 ] | |
[ b a 30 * ] | |
[ b a 30 1 2 ] | |
[ b a 03 * ] | |
[ b a 031 2 ] | |
[ b a 03 * ] | |
[ b a 031 2 ] | |
[ b a 03 * ] | |
[ b a 0 31 2 ] | |
[ b a 0 3 * ] | |
[ b a 0 31 2 ] | |
[ b a 03 * ] | |
[ b a 0 3 * ] | |
[ b a 0 31 2 ] | |
[ b a 0 3 * ] | |
[ b a 0 3 * ] | |
[ b a 0 31 2 ] | |
[ b a 0 3 * ] | |
[ b a 0 3 * ] | |
[ b a 03 * ] | |
[ b a 03 1 2 ] | |
[ b a 30 1 2 ] | |
[ b a 03 * ] | |
[ b a 30 * ] | |
[ b a 3 0 * ] | |
[ b a 30 1 2 ] | |
[ b a 3 0 1 2 ] | |
[ b a 30 1 2 ] | |
[ b a 3 0 * ] | |
[ b a 3 0 * ] | |
[b a 30 * ] | |
[ b a 3 0 2 1 ] | |
[b a 3 0 * ] | |
[b a 30 * ] | |
[b a 30 2 1 ] | |
[b a 30 2 1 ] | |
[ a 30 2 1 b] | |
[ a 032 1 b] | |
[ a 0 23 1 b] | |
[ a 0 23 1 b] | |
[ a *3 1 b] | |
[ a 2 03 1 b ] | |
[ a 2 03 1 b ] | |
[ a2 30 1 b ] | |
[ * 30 1 b ] | |
[ 2a 30 1 b ] | |
[ 2 a 30 1b ] | |
[ 2 a30 * ] | |
[ 2*0 b 1 ] | |
[ 2 0* b 1] | |
[1 2 0 a3 b ] | |
[ 1 * * b ] | |
[ 1 * 3a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ * 23 a b ] | |
[ 0 *3 a b ] | |
[ *32 a b ] | |
[ 03* a b ] | |
[ 3* 2 a b ] | |
[ 30 * a b ] | |
[ 3 * a b ] | |
[ 3 * a b ] | |
[ 3 2 * a b ] | |
[ 32 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 32 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 32 0 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3 * 1 a b ] | |
[ 30 2 1 a b ] | |
[ 30 2 1 a b ] | |
[ 3 * 1 a b ] | |
[ 30 2 1 a b ] | |
[ 3 * 1 a b ] | |
[ 30 2 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 32 0 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3* 1 a b ] | |
[ 30 2 1 a b ] | |
[ 3* 1 a b ] | |
[ 30 * a b ] | |
[ 3 * 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3* 1 a b ] | |
[ 30 2 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[3 2 * a b ] | |
[ 3 2 * a b ] | |
[3 2 0 1 a b ] | |
[ 2 * a b 3] | |
[3 2 0 1 a b ] | |
[ 2 * a b 3] | |
[3 2 0 1 a b ] | |
[ 32 * a b ] | |
[3 2 0 1 a b ] | |
[ 32 * a b ] | |
[3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[3 2 0 1 a b ] | |
[ 32 * a b ] | |
[3 2 0 1 a b ] | |
[ 2 * a b 3] | |
[3 2 * a b ] | |
[ 2 0 1 a b 3] | |
[3 2 * a b ] | |
[ 2 0 1 a b 3] | |
[3 2 * a b ] | |
[ 2 0 1 a b 3] | |
[3 2 0 1 a b ] | |
[ 2 0 1 a b 3] | |
[3 2 * a b ] | |
[ 2 0 1 a b 3] | |
[3 2 0 1 a b ] | |
[ 2 0 1 a b 3] | |
[3 2 0 1 a b ] | |
[ 2 0 1 a b 3] | |
[3 2 * a b ] | |
[ 2 0 1 a b 3] | |
[3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 * 1 a b ] | |
[ 3 2 0 1 a b ] | |
[3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 32 0 1 a b ] | |
[ 32 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 * 1 a b ] | |
[ 3 * 1 a b ] | |
[ 3 2 * a b ] | |
algorithm.iteration=250 | |
results['episode_reward_mean']=185470.48 | |
blue_agent_0_proximity_to_red_agent_0_mean=0.347 | |
blue_agent_0_proximity_to_red_agent_1_mean=0.347 | |
blue_agent_0_proximity_to_red_agent_2_mean=0.123 | |
blue_agent_0_proximity_to_red_agent_3_mean=0.191 | |
blue_agent_1_proximity_to_red_agent_0_mean=0.146 | |
blue_agent_1_proximity_to_red_agent_1_mean=0.273 | |
blue_agent_1_proximity_to_red_agent_2_mean=0.165 | |
blue_agent_1_proximity_to_red_agent_3_mean=0.425 | |
Sample game: | |
[ b1 a 0 3 2 ] | |
[ b1 a 0 3 2 ] | |
[ * a 0 3 2 ] | |
[ 1b a 0 3 2 ] | |
[ 1 b a 0 3 2 ] | |
[ 1 b a 0 3 2 ] | |
[ 1 b a 0 3 2 ] | |
[ 1 b a 0 32 ] | |
[ 1 b a 0 32 ] | |
[1 b a 0 32 ] | |
[ b a 0 32 1] | |
[ b a 0 32 1 ] | |
[ b a 0 3 2 1 ] | |
[ b a 0 32 1 ] | |
[ b a 0 23 1 ] | |
[ b a 0 32 1 ] | |
[ b a 0 32 1 ] | |
[ b a 0 23 1 ] | |
[ b a 0 23 1 ] | |
[ b a 0 23 1 ] | |
[ b a 0 23 1 ] | |
[ b a 0 2 31 ] | |
[ b a * 31 ] | |
[ b a * 31 ] | |
[ b a 0 2 13 ] | |
[ b a 0 2 13 ] | |
[ b a * 13 ] | |
[ b a 2 0 1 3 ] | |
[ b a * 1 3 ] | |
[b a * 1 3 ] | |
[b a 2 0 1 3 ] | |
[b a 2 0 13 ] | |
[b a 2 0 13 ] | |
[b a 2 0 31 ] | |
[ a 2 0 31 b] | |
[ a * 3 1 b] | |
[ a * 3 1 b] | |
[ a * 3 1 b ] | |
[ a * 3 1 b ] | |
[ a * 3 1 b ] | |
[ a 2 0 3 1 b ] | |
[ a 2 0 3 1 b ] | |
[ a 2 0 3 1 b ] | |
[ a 2 0 3 1 b ] | |
[ a 2 0 3 1b ] | |
[ a 2 0 3 b1 ] | |
[ a2 0 3 b 1] | |
[1 2a 0 3 b ] | |
[ 1 2 a 0 3 b ] | |
[ 1 2 a 0 3 b ] | |
[ 1 2 a 0 3 b ] | |
[ 1 2 a 0 3 b ] | |
[ 1 2 a 0 3 b ] | |
[ 1 2 a 0 3 b ] | |
[ 1 2 a 0 3 b ] | |
[ 1 2 a0 3 b ] | |
[ 1 2 * 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ * 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ * 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 * a 3 b ] | |
[ * 2 a 3 b ] | |
[ 1 * a 3 b ] | |
[ * 2 a 3 b ] | |
[ 1 * a 3 b ] | |
[ 1 * a 3 b] | |
[ * 2 a3 b ] | |
[ * 2 a 3 b] | |
[ 1 0 2 a3 b] | |
[ 1 0 2 * b] | |
[b * 2 3a ] | |
[b 1 0 2 3 a ] | |
[b 1 * 3 a ] | |
[ b 1 0 2 3 a ] | |
[ b 1 0 2 3 a ] | |
[ b * 2 3 a ] | |
[ b * 3 a ] | |
[ b 1 * 3 a ] | |
[ b 1 * 3 a ] | |
[ b 1 * 3 a ] | |
[ b 1 0 2 3 a ] | |
[ b 1 * 3 a ] | |
[ b * 2 3 a ] | |
[ b 1 * 3 a ] | |
[ b 1 * 3 a ] | |
[ b 1 * 3 a ] | |
[ b * 23 a ] | |
[ b 1 *3 a ] | |
[ b 13* a ] | |
[ b 132 0 a ] | |
[ b 3* 0 a ] | |
[ b 3 * 0 a ] | |
[ b 3 * a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 3 * a ] | |
[ b 3 2 * a ] | |
[ b 32 * a ] | |
[ b 32 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 32 * a ] | |
[ b 3 2 1 0 a ] | |
[ b 3 2 1 0 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 1 0 a ] | |
[ b 3 2 1 0 a ] | |
[ b 3 * 0 a ] | |
[ b 3 2 1 0 a ] | |
[ b 3 2 1 0 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 1 0 a ] | |
[ b 32 * a ] | |
[ b 32 0 1 a ] | |
[ b 23 0 1 a ] | |
[ b 23 * a ] | |
[ b 32 * a ] | |
[ b 32 0 1 a ] | |
[ b 32 * a ] | |
[ b 3 2 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b 3 2 * a ] | |
[ b 32 * a ] | |
[ b 23 0 1 a ] | |
[ b 23 * a ] | |
[ b 23 * a ] | |
[ b 23 * a ] | |
[ b 23 * a ] | |
[ b 2 3 * a ] | |
[ b 23 * a ] | |
[ b 23 * a ] | |
[ b 230 1 a ] | |
[ b 230 1 a ] | |
[ b *3 1 a ] | |
[ b * 31 a ] | |
[ b 2 0 13 a ] | |
[ b * 13 a ] | |
[ b 2 0 13 a ] | |
[ b 2 * 3 a ] | |
[ b 2 1 0 3 a ] | |
[ b 2 1 0 3 a ] | |
[ b 2 1 0 3 a ] | |
[ b 2 1 0 3 a ] | |
[ b 2 1 03 a ] | |
[ b * 03 a ] | |
[ b * 03 a ] | |
[ b 2 1 0 3 a ] | |
[ b 2 1 0 3 a ] | |
[ b 2 1 0 3 a ] | |
[ b 2 1 0 3 a ] | |
[ b * 03 a ] | |
[ b 1 2 30 a ] | |
[ b 1 2 30 a ] | |
[ * 2 3 0 a ] | |
[ 1b 2 3 0 a ] | |
[ 1 b 2 3 0 a ] | |
[ 1 b 2 3 0 a ] | |
[ 1 b 2 3 0 a ] | |
[ 1 b 2 3 0 a ] | |
[ 1 b 2 3 0 a ] | |
[ 1 b 2 30 a ] | |
[ 1 b 2 03 a ] | |
[ 1 b2 30 a ] | |
[ 1 b 2 30 a ] | |
[ 1 b2 30 a ] | |
[ 1 2b 30 a ] | |
[ 1 2 b 3 0 a ] | |
[ 1 2 b 3 0 a ] | |
[ 1 2 b 3 0 a ] | |
[ 1 2 b 3 0 a ] | |
[ 1 2b 3 0 a ] | |
[ 1 * 3 0 a ] | |
[ 1 b2 3 0 a ] | |
[ 1 b 2 3 0 a ] | |
[ 1 b 2 3 0 a ] | |
[ 1 b 23 0 a ] | |
[ 1 b 32 0 a ] | |
[ 1 b 3 2 0 a ] | |
[ 1 b 3 2 0 a ] | |
[ 1 b 3 2 0 a ] | |
[ 1 b 3 2 0 a ] | |
[ 1 b3 2 0 a ] | |
[ 1 * 2 0 a ] | |
[ 1 3b 2 0 a] | |
[ 1 3 b * a] | |
[ 1 3 b * a] | |
[a 1 3 b 0 2 ] | |
[a 1 3 b 0 2 ] | |
[a 1 3 b 0 2 ] | |
[a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b * ] | |
[ a 1 3 b * ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a1 3 b 0 2 ] | |
[ a 1 3 b 0 2 ] | |
[ a1 3 b 0 2 ] | |
[ a1 3 b 0 2 ] | |
[ * 3 b 0 2 ] | |
[ a1 3 b 0 2 ] | |
[ 1a 3 b 0 2 ] | |
[ * 3 b 0 2 ] | |
[ a1 3 b 0 2 ] | |
[ 1a 3 b 0 2 ] | |
[ * 3 b 0 2 ] | |
[ 1a 3 b 0 2 ] | |
[ * 3 b 0 2 ] | |
[ 1 a 3 b 0 2 ] | |
[ 1a 3 b 0 2 ] | |
[ 1 a 3 b 0 2 ] | |
[ 1 a 3 b 0 2 ] | |
[ 1 a 3 b 0 2 ] | |
[ 1 a 3 b 0 2 ] | |
[ 1 a 3 b 0 2 ] | |
[ 1 a 3 b 0 2 ] | |
[ 1 a 3 b 0 2 ] | |
[ 1 a 3 b 0 2 ] | |
[1 a 3 b 0 2 ] | |
[ a 3 b 0 2 1] | |
[ a 3 b 0 2 1 ] | |
[ a 3 b 0 2 1 ] | |
[ a 3 b 0 * ] | |
[ a 3 b 0 1 2 ] | |
[ a 3 b 0 * ] | |
[ a 3 b 0 * ] | |
[ a 3 b 0 2 1 ] | |
[ a 3 b0 2 1] | |
[ a 3 b 0 * ] | |
[ a 3 b0 * ] | |
[ a 3 b0 * ] | |
[ a 3 b 0 2 1] | |
[1 a 3 b 0 2 ] | |
[ 1 a 3 b 0 2] | |
[* a 3 b 0 ] | |
[ 1 a 3 b 0 2] | |
[2 1 a 3 b 0 ] | |
[ 2 1 a 3 b 0 ] | |
[2 1 a 3 b 0 ] | |
[ * a 3 b 0 ] | |
[1 2 a 3 b 0 ] | |
[ * a 3 b 0 ] | |
[1 2 a 3 b 0 ] | |
[ 2 a 3 b 0 1] | |
[ 2 a 3 b 0 1 ] | |
[ 2 a 3 b 0 1] | |
[ 2 a 3 b 0 1 ] | |
[ 2 a 3 b 0 1 ] | |
[ 2 a 3 b 0 1 ] | |
[ 2 a 3 b0 1 ] | |
[ 2 a 3 0b 1 ] | |
[ 2 a 3 * 1] | |
[1 2 a 3 b0 ] | |
[ 2 a 3 * 1] | |
[ 2 a 3 * 1 ] | |
[ 2 a 3 b0 1 ] | |
[ 2 a 3 b 0 1 ] | |
[ 2 a 3 * 1 ] | |
[ 2 a 3 b0 1 ] | |
[ 2 a 3 * 1 ] | |
[ 2 a 3 * 1 ] | |
[ 2 a 3 b0 1 ] | |
[ 2 a 3 * 1 ] | |
[ 2 a 3 0 b 1 ] | |
[ 2 a 3 0b1 ] | |
[ 2 a 3 * ] | |
[ 2 a 3 1 * ] | |
[ 2 a 3 1 0b ] | |
[ 2 a 3 * b ] | |
[ 2 a 3 1 0b ] | |
[ 2 a 3 1 0 b ] | |
[ 2 a 3 1 0 b ] | |
[ 2 a 3 1 0 b ] | |
[ 2 a 3 1 0 b ] | |
[ 2 a 3 1 0 b ] | |
algorithm.iteration=251 | |
results['episode_reward_mean']=185578.6 | |
blue_agent_0_proximity_to_red_agent_0_mean=0.346 | |
blue_agent_0_proximity_to_red_agent_1_mean=0.344 | |
blue_agent_0_proximity_to_red_agent_2_mean=0.123 | |
blue_agent_0_proximity_to_red_agent_3_mean=0.194 | |
blue_agent_1_proximity_to_red_agent_0_mean=0.144 | |
blue_agent_1_proximity_to_red_agent_1_mean=0.271 | |
blue_agent_1_proximity_to_red_agent_2_mean=0.163 | |
blue_agent_1_proximity_to_red_agent_3_mean=0.431 | |
Sample game: | |
[ 3 1 0 b 2 a ] | |
[ 3 1 0 b 2 a ] | |
[ 3 1 0 b 2 a ] | |
[ 3 1 0 b 2 a ] | |
[ 3 1 0 b 2 a ] | |
[ 3 1 0 b 2 a ] | |
[ 3 1 0 b2 a ] | |
[ 3 1 0 b 2 a ] | |
[ 3 10 * a ] | |
[ 3 01 2b a ] | |
[ 3 0 1 * a ] | |
[ 3 0 1 * a ] | |
[ 3 0 1 2b a ] | |
[ * 1 2 b a ] | |
[ * 1 2 b a ] | |
[ * 1 2 b a ] | |
[ *1 2 b a ] | |
[ * 1 2 b a ] | |
[ *1 2 b a ] | |
[ 3 01 2 b a ] | |
[ *1 2 b a ] | |
[ 3 01 2 b a ] | |
[ *1 2 b a ] | |
[ * 1 2 b a ] | |
[ 3 01 2 b a ] | |
[ *1 2 b a ] | |
[ 3 01 2 b a ] | |
[ *1 2 b a ] | |
[ * 1 2 b a ] | |
[ 3 01 2 b a ] | |
[ *1 2 b a ] | |
[ * 1 2 b a ] | |
[ 3 01 2 b a ] | |
[ * 1 2 b a ] | |
[ 3 01 2 b a ] | |
[ * 1 2 b a ] | |
[ * 1 2 b a ] | |
[ * * b a ] | |
[ * 1 2 b a ] | |
[ * * b a ] | |
[ 3 01 2 b a ] | |
[ * * b a ] | |
[ * 1 2 b a ] | |
[ * * b a ] | |
[ * 1 2 b a ] | |
[ * * b a ] | |
[ * 1 2 b a ] | |
[ * * b a ] | |
[ * 1 2 b a ] | |
[ * 1 2 b a ] | |
[ 3 01 2 b a ] | |
[ * * b a ] | |
[ * 1 2 b a ] | |
[ * * b a ] | |
[ * 1 2 b a ] | |
[ * * b a ] | |
[ *1 2 b a ] | |
[ * 1 2 b a ] | |
[ *1 2 b a ] | |
[ * 1 2 b a ] | |
[ *1 2 b a ] | |
[ * 1 2 b a ] | |
[ *1 2 b a ] | |
[ * 1 2 b a ] | |
[ * * b a ] | |
[ * 1 2 b a ] | |
[ *1 2 b a ] | |
[ * * b a ] | |
[ *1 2 b a ] | |
[ * * b a ] | |
[ 0 31 2 b a ] | |
[ * * b a ] | |
[ 0 31 2 b a ] | |
[ 0 3 * b a ] | |
[ 0 31 2 b a ] | |
[ 0 3 * b a ] | |
[ 0 31 2 b a ] | |
[ 0 3 * b a ] | |
[ 0 31 2 b a ] | |
[ 0 3* b a ] | |
[ 0 3 * b a ] | |
[ 0 3* b a ] | |
[ 0 3* b a ] | |
[ 0 31 2 b a ] | |
[ 0 3 * b a] | |
[ 0 3 * b a] | |
[ 0 3* b a] | |
[a 0 31 2 b ] | |
[a 0 3 * b ] | |
[a 0 3 * b ] | |
[a 0 3 * b ] | |
[ a 0 3 1 2 b ] | |
[ a * 1 2 b ] | |
[ a 3 0 1 2 b ] | |
[ a 3 0 1 2 b ] | |
[ a 3 0 * b ] | |
[ a 3 0 * b ] | |
[ a 3 0 1 2 b ] | |
[ a 3 01 2 b ] | |
[ a 3 01 2 b ] | |
[ a 3 01 2 b ] | |
[ a 3 01 2 b ] | |
[ a 3 102 b ] | |
[ a 3 0* b ] | |
[ a 3 201 b ] | |
[ a 3 201 b ] | |
[ a 3 *0 b ] | |
[ a 3 201 b ] | |
[ a 3 2 10 b ] | |
[ a 3 2 01 b ] | |
[ a 3 2 0 1 b ] | |
[ a 3 2 01 b ] | |
[ a 3 20 1 b ] | |
[ a 3 2 01 b ] | |
[ a 3 2 0 1 b ] | |
[ a 3 2 01 b ] | |
[ a 3 2 0 1 b ] | |
[ * 2 0 1 b ] | |
[ 3a 2 01 b ] | |
[ 3 a 2 01 b ] | |
[ 3 a 2 01 b ] | |
[ 3 * 01 b ] | |
[ 3 2a 01 b ] | |
[ 3 2 a 01 b ] | |
[ 3 2 a 01 b ] | |
[ 3 2 a 0 1 b ] | |
[3 2 a 0 1b ] | |
[ 2 a 0 b1 3] | |
[ 2 a 0 b 1 3 ] | |
[ 2 a 0 b 1 3 ] | |
[ 2 a 0 b 1 3 ] | |
[2 a 0 b 1 3 ] | |
[ a 0 b 1 3 2] | |
[ a 0 b 1 3 2 ] | |
[ * b 1 3 2 ] | |
[ 0a b 1 3 2 ] | |
[ 0 a b 1 3 2 ] | |
[ 0 a b 1 3 2 ] | |
[ 0 a b 1 3 2 ] | |
[ 0 a b 1 3 2 ] | |
[ 0 a b 1 32 ] | |
[ 0 a b 1 32 ] | |
[ 0 a b 1 3 2 ] | |
[ 0 a b 1 32 ] | |
[ 0 a b 1 3 2 ] | |
[ 0 a b 1 3 2 ] | |
[ 0 a b 1 32 ] | |
[ 0 a b 1 3 2 ] | |
[0 a b 1 32 ] | |
[ a b 1 3 2 0] | |
[ a b 13 2 0 ] | |
[ a b 13 2 0 ] | |
[ a b 132 0 ] | |
[ a b 31 20 ] | |
[ a b 3*0 ] | |
[ a b 3 0* ] | |
[ a b * * ] | |
[ a b * * ] | |
[ a b 3 02 1 ] | |
[ a b * * ] | |
[ a b 3 02 1 ] | |
[ a b 3 0* ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b 320 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b *2 1 ] | |
[ a b *2 1 ] | |
[ a b *2 1 ] | |
[ a b * 2 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 0* ] | |
[ a b 3 201 ] | |
[ a b 3 201 ] | |
[ a b 3 2 01 ] | |
[ a b 3 2 01 ] | |
[ a b 3 20 1 ] | |
[ a b 3 20 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 20 1 ] | |
[ a b 32 01 ] | |
[ a b 3 20 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b *2 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 20 1 ] | |
[ a b 32 01 ] | |
[ a b 3 2 01 ] | |
[ a b 3 201 ] | |
[ a b 3 2 10 ] | |
[ a b 32 01 ] | |
[ a b 3 20 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 20 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b * 2 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1 ] | |
[ a b 3 201 ] | |
[ a b 3 201 ] | |
[ a b 3 2 01 ] | |
[ a b 32 01 ] | |
[ a b 3 2 0 1 ] | |
[ a b 3 2 01 ] | |
[ a b 3 2 01 ] | |
[ a b 3 2 01 ] | |
[ a b 3 2 01] | |
[1 a b 32 0 ] | |
[ a b 3 2 0 1] | |
[1 a b 3 2 0 ] | |
[ a b 3 2 01] | |
[1 a b 3 2 0 ] | |
[ a b 3 20 1] | |
[1 a b 3 20 ] | |
[ a b 3 2 01] | |
[ a b 3 2 01 ] | |
[ a b 3 20 1] | |
[1 a b 320 ] | |
[ a b *2 1] | |
[1 a b 2* ] | |
[ 1 a b *2 ] | |
[ 1 a b 2* ] | |
[ 1 a b 320 ] | |
[ 1 a b 3 02 ] | |
[ 1 a b 320 ] | |
[ 1 a b 320 ] | |
[ 1 a b *2 ] | |
[ 1 a b 2* ] | |
[ 1 a b 2* ] | |
[1 a b 2* ] | |
[ a b 3201] | |
[1 a b 3 20] | |
[01 a b 3 2] | |
[201 a b 3 ] | |
[ 01 a b 32] | |
[ 0 1 a b 23] | |
[ 01 a b 32] | |
[ 0 1 a b 32 ] | |
[0 1 a b 3 2] | |
[201 a b 3 ] | |
[ 01 a b 3 2] | |
[201 a b 3 ] | |
[ 10 a b 3 2] | |
[201 a b 3 ] | |
[ *0 a b 3 ] | |
[2 10 a b 3 ] | |
[ 10 a b 32] | |
[ 10 a b 23] | |
[ 01 a b 32] | |
[ 01 a b 23] | |
[ 01 a b 32] | |
[ 0 1 a b 23] | |
[ 01 a b 32] | |
[2 01 a b 3 ] | |
[ 2 10 a b 3 ] | |
[2 10 a b 3 ] | |
[ 201 a b 3 ] | |
[ 201 a b 3 ] | |
[ *0 a b 3 ] | |
[ 201 a b 3 ] | |
[ *0 a b 3 ] | |
[ *0 a b 3 ] | |
[ 2 10 a b 3 ] | |
[2 01 a b 3] | |
[ 01 a b 32] | |
[2 10 a b 3 ] | |
[ 2 01 a b 3 ] | |
[ 20 1 a b 3 ] | |
[ 201 a b 3 ] | |
[ 2 10 a b 3 ] | |
[ 2 10 a b 3 ] | |
[ 2 10 a b 3 ] | |
[ 2 01 a b 3 ] | |
[2 01 a b 3 ] | |
[ 01 a b 3 2] | |
[ 01 a b 32 ] | |
[ 0 1 a b 23 ] | |
[ 01 a b2 3] | |
[ 10 a b 23 ] | |
[ 10 a b23 ] | |
[ 10 a b32 ] | |
[ 10 a * 2 ] | |
[ 01 a b 3 2] | |
[2 01 a b 3 ] | |
[ 2 10 a b3 ] | |
[2 10 a b 3 ] | |
[ 2 10 a b 3 ] | |
[2 10 a b3 ] | |
algorithm.iteration=252 | |
results['episode_reward_mean']=185476.40800000005 | |
blue_agent_0_proximity_to_red_agent_0_mean=0.347 | |
blue_agent_0_proximity_to_red_agent_1_mean=0.346 | |
blue_agent_0_proximity_to_red_agent_2_mean=0.123 | |
blue_agent_0_proximity_to_red_agent_3_mean=0.192 | |
blue_agent_1_proximity_to_red_agent_0_mean=0.143 | |
blue_agent_1_proximity_to_red_agent_1_mean=0.271 | |
blue_agent_1_proximity_to_red_agent_2_mean=0.167 | |
blue_agent_1_proximity_to_red_agent_3_mean=0.426 | |
Sample game: | |
[ a 32 b 1 0 ] | |
[ a 32 b 1 0 ] | |
[ a 23 b 1 0 ] | |
[ a 2 3b 1 0 ] | |
[ a 2 3 b 1 0 ] | |
[ a 2 3b 1 0 ] | |
[ a 23 b 1 0 ] | |
[ a 23 b 1 0 ] | |
[ a 32 b 1 0 ] | |
[ a 3 2 b 1 0 ] | |
[ a 3 2b 1 0 ] | |
[ a 3 2 b 1 0 ] | |
[ a 32 b 1 0 ] | |
[ a 3 2b 1 0 ] | |
[ a3 2 b 1 0 ] | |
[ 3a 2 b 1 0 ] | |
[ 3 a2 b * ] | |
[ 3 * b 0 1 ] | |
[ 3 * b 0 1 ] | |
[ 3 2a b 0 1 ] | |
[ 3 2 a b 0 1 ] | |
[ 3 2 a b 0 1 ] | |
[ 3 2 a b 0 1 ] | |
[3 2 a b 0 1 ] | |
[ 2 a b 0 1 3] | |
[ 2 a b 0 1 3 ] | |
[ 2 a b 0 1 3 ] | |
[ 2 a b 0 1 3 ] | |
[ 2 a b 0 1 3 ] | |
[ 2 a b 0 1 3 ] | |
[2 a b 0 1 3 ] | |
[ a b 0 1 3 2] | |
[ a b 0 1 3 2 ] | |
[ a b 0 1 3 2 ] | |
[ a b 0 1 3 2 ] | |
[ a b 0 1 3 2 ] | |
[ a b 0 1 3 2 ] | |
[ a b 0 1 3 2 ] | |
[ a b 0 13 2 ] | |
[ a b 0 13 2 ] | |
[ a b 0 31 2 ] | |
[ a b 0 31 2 ] | |
[ a b 0 3 1 2 ] | |
[ a b 03 1 2 ] | |
[ a b 03 1 2 ] | |
[ a b 03 1 2 ] | |
[ a b 30 1 2 ] | |
[ a b 30 * ] | |
[ a b 30 * ] | |
[ a b 30 2 1 ] | |
[ a b 30 2 1 ] | |
[ a b 032 1 ] | |
[ a b *3 1 ] | |
[ a b 032 1 ] | |
[ a b *3 1 ] | |
[ a b 3* 1 ] | |
[ a b 032 1 ] | |
[ a b 3* 1 ] | |
[ a b 032 1 ] | |
[ a b 30 * ] | |
[ a b 032 1 ] | |
[ a b 30 * ] | |
[ a b 3* 1 ] | |
[ a b 30 2 1 ] | |
[ a b 30 * ] | |
[ a b 30 2 1 ] | |
[ a b 3* 1 ] | |
[ a b 30 2 1 ] | |
[ a b 30 * ] | |
[ a b 30 2 1 ] | |
[ a b 30 * ] | |
[ a b 30 2 1 ] | |
[ a b 032 1 ] | |
[ a b 30 * ] | |
[ a b 032 1 ] | |
[a b 30 * ] | |
[a b 30 2 1 ] | |
[a b 30 * ] | |
[a b 30 2 1 ] | |
[ b 032 1 a] | |
[ b 30 * a] | |
[ b 30 2 1 a] | |
[ b 30 * a ] | |
[ b 3 * a ] | |
[ b 3 * a ] | |
[ b 3 2 * a ] | |
[ b 32 0 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 30 2 1 a ] | |
[ b 30 2 1 a ] | |
[ b 3* 1 a ] | |
[ b 3 * 1 a ] | |
[ b 30 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 30 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 30 2 1 a ] | |
[ b 30 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 32 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 * 1 a ] | |
[ b 30 2 1 a ] | |
[ b 3 * 1 a ] | |
[ b 3 * a ] | |
[ b 3 2 * a ] | |
[ b 32 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 32 0 1 a ] | |
[ b 32 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 32 0 1 a ] | |
[ b 32 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 32 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 32 * a ] | |
[ b 32 1 0 a ] | |
[ b 32 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 3 2 1 0 a ] | |
[ b 3 * 0 a ] | |
[ b 3 * a ] | |
[ b 3 * a ] | |
[ b 3 * 0 a ] | |
[ b 3 * 0 a] | |
[ b3 1 * a] | |
[ * * 0 a] | |
[a * * 0 ] | |
[ b3 1 2 0 a] | |
[a b 3 1 2 0 ] | |
[ b3 1 * a] | |
[a b3 1 2 0 ] | |
[a b 3 * 0 ] | |
[a b 3 1 * ] | |
[a b3 1 * ] | |
[ a b 3 1 2 0 ] | |
[ a b3 1 2 0 ] | |
[ a 3b 1 * ] | |
[ a 3 b 1 * ] | |
[ a 3 b 1 * ] | |
[ a 3 b 1 * ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 * ] | |
[ a 3 b 1 * ] | |
[ a 3 b 1 * ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b * 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b * 0 ] | |
[ a 3 b * 0 ] | |
[ a 3 b * 0 ] | |
[ a 3 b * 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b * 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b * 0 ] | |
[ a 3 b * 0 ] | |
[ a 3 b * 0] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b * 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b * 0] | |
[0 a 3 b * ] | |
[ a 3 b 1 2 0] | |
[0 a 3 b 1 2 ] | |
[ a 3 b 1 *] | |
[0 a 3 b 1 2 ] | |
[ a 3 b * 0] | |
[0 a 3 b * ] | |
[ 0 a 3 b 1 2] | |
[* a 3 b 1 ] | |
[ 0 a 3 b 1 2] | |
[2 0 a 3 b 1 ] | |
[ 0 a 3 b *] | |
[2 0 a 3 b 1 ] | |
[ 2 0 a 3 b 1] | |
[* 0 a 3 b ] | |
[ 2 0 a 3 b 1] | |
[1 * a 3 b ] | |
[ 2 0 a 3 b 1] | |
[1 2 0 a 3 b ] | |
[ * 0 a 3 b ] | |
[1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ * 0 a 3 b ] | |
[ * 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 * a 3 b ] | |
[ * 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 * a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ * 0 a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 * a 3 b ] | |
[ 1 2 0 a 3 b ] | |
[ 1 * a 3 b ] | |
[ 1 2 0 a3 b ] | |
[ 1 * * b ] | |
[ 1 * 3a b ] | |
[ 1 * 3 a b ] | |
[ 1 0 2 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 0 2 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 0 2 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 * 3 a b ] | |
[ 1 2 03 a b ] | |
[ 1 *3 a b ] | |
[ 13* a b ] | |
[ 3* 0 a b ] | |
[ 31 * a b ] | |
[ 3 * 0 a b ] | |
[ 32 * a b ] | |
[ 3* 0 a b ] | |
[ 32 1 0 a b ] | |
[ 3 2 * a b ] | |
[ 32 0 1 a b ] | |
[ 32 * a b ] | |
[ 32 * a b ] | |
[ 23 * a b ] | |
[ 32 * a b ] | |
[ 32 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 * 1 a b ] | |
[ 3 * a b ] | |
[ 3 * a b ] | |
[ 3* 1 a b ] | |
[ 03* a b ] | |
algorithm.iteration=253 | |
results['episode_reward_mean']=185652.60599999997 | |
blue_agent_0_proximity_to_red_agent_0_mean=0.354 | |
blue_agent_0_proximity_to_red_agent_1_mean=0.343 | |
blue_agent_0_proximity_to_red_agent_2_mean=0.119 | |
blue_agent_0_proximity_to_red_agent_3_mean=0.191 | |
blue_agent_1_proximity_to_red_agent_0_mean=0.139 | |
blue_agent_1_proximity_to_red_agent_1_mean=0.273 | |
blue_agent_1_proximity_to_red_agent_2_mean=0.168 | |
blue_agent_1_proximity_to_red_agent_3_mean=0.431 | |
Sample game: | |
[ b 1 3 2 0 a] | |
[a b 1 3 2 0 ] | |
[a b 1 3 2 0 ] | |
[a b 1 3 2 0 ] | |
[a b 1 3 2 0 ] | |
[ a b 1 3 2 0 ] | |
[ a b 1 3 2 0 ] | |
[ a b 1 3 2 0 ] | |
[ a b 1 3 2 0 ] | |
[ a b 1 3 2 0 ] | |
[ a b 1 3 2 0 ] | |
[ a b 1 3 2 0 ] | |
[ a b 1 32 0 ] | |
[ a b 1 32 0 ] | |
[ a b 1 32 0 ] | |
[ a b 1 23 0 ] | |
[ a b 123 0 ] | |
[ a b *20 ] | |
[ a b *2 ] | |
[ a b 2* ] | |
[ a b *21 ] | |
[ a b *21 ] | |
[a b *2 1 ] | |
[a b *2 1 ] | |
[a b *2 1 ] | |
[a b *2 1 ] | |
[ b 3 021 a] | |
[ b *2 1 a] | |
[ b 3 021 a] | |
[ b * 21 a ] | |
[ b 3 021 a ] | |
[ b * 12 a ] | |
[ b 3 021 a ] | |
[ b * 21 a ] | |
[ b * 21 a ] | |
[ b 3 021 a ] | |
[ b * 21 a ] | |
[ b *21 a ] | |
[ b * 12 a ] | |
[ b 3 *2 a ] | |
[ b *21 a ] | |
[ b 3 021 a ] | |
[ b *2 1 a ] | |
[ b * 21 a ] | |
[ b 3 021 a ] | |
[ b 3 021 a ] | |
[ b 3 02 1 a ] | |
[ b * 21 a ] | |
[ b 3 021 a ] | |
[ b *2 1 a ] | |
[ b * 21 a ] | |
[ b 3 02 1 a ] | |
[ b 320 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 021 a ] | |
[ b 3 02 1 a ] | |
[ b 320 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 021 a ] | |
[ b 3 02 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 021 a ] | |
[ b 3 20 1 a ] | |
[ b 32 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 32 * a ] | |
[ b 3 20 1 a ] | |
[ b 3 20 1 a ] | |
[ b 320 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 021 a ] | |
[ b 3 02 1 a ] | |
[ b 320 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 021 a ] | |
[ b 3 20 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[ b 32 * a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[ b 32 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 20 1 a ] | |
[ b 32 0 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 32 0 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 2* a ] | |
[ b 3 2 * a ] | |
[ b 32 0 1 a ] | |
[ b 3 20 1 a ] | |
[b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 32 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 20 1 a ] | |
[ b 32 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 32 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 2 * a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 32 0 1 a ] | |
[ b 3 20 1 a ] | |
[b 3 20 1 a ] | |
[ b 3 02 1 a ] | |
[b 3 20 1 a ] | |
[b 3 20 1 a ] | |
[b 3 2 * a ] | |
[b 3 2 0 1 a ] | |
[b 3 2 * a ] | |
[b 3 2 0 1 a ] | |
[b 3 2 * a ] | |
[b 3 2 0 1 a ] | |
[b 3 2 0 1 a ] | |
[b 3 2 0 1 a ] | |
[ 3 2 0 1 a b] | |
[ 3 2 0 1 a b] | |
[ 3 20 1 a b] | |
[ 3 2 * a b ] | |
[ 3 20 1 a b] | |
[ 3 2 * a b] | |
[ 3 20 1 a b] | |
[ 3 2 * a b] | |
[ 3 2 0 1 a b] | |
[b 3 2 * a ] | |
[ 3 2 0 1 a b] | |
[b 3 2 0 1 a ] | |
[ 3 2 * a b] | |
[ 3 2 0 1 a b] | |
[ 3 2 * a b] | |
[ 3 2 * a b] | |
[ 3 2 * a b] | |
[ 3 2 * a b] | |
[ 3 2 0 1 a b] | |
[b 3 2 * a ] | |
[b 3 2 0 1 a ] | |
[b 3 2 0 1 a ] | |
[ 3 2 0 1 a b] | |
[b 3 2 * a ] | |
[ 3 20 1 a b] | |
[b 3 2 0 1 a ] | |
[ 3 2 * a b] | |
[ 3 2 0 1 a b] | |
[ 3 2 * a b] | |
[ 3 2 0 1 a b] | |
[ 3 2 * a b] | |
[ 3 2 * a b ] | |
[ 3 20 1 a b] | |
[ 3 20 1 a b ] | |
[ 3 02 1 a b ] | |
[ 3 02 1 a b ] | |
[ *2 1 a b ] | |
[ 3 021 a b ] | |
[ 3 02 1 a b ] | |
[ 3 021 a b ] | |
[ 3 20 1 a b ] | |
[ 3 20 1 a b ] | |
[ 3 02 1 a b ] | |
[ 3 02 1 a b ] | |
[ 3 021 a b ] | |
[ 3 20 1 a b ] | |
[ 3 2* a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 20 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 32 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 20 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 20 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 * a b ] | |
[ 3 20 1 a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 2 * a b ] | |
[ 3 2 0 1 a b ] | |
[ 3 20 1 a b ] | |
[ 3 20 1 a b ] | |
[ 3 02 1 a b ] | |
[ 3 20 1 a b ] | |
[ 320 1 a b ] | |
[ 3 02 1 a b ] | |
[ *2 1 a b ] | |
[ 3 02 1 a b ] | |
[ 3 20 1 a b ] | |
[ 3 02 1 a b ] | |
[ 3 20 1 a b ] | |
[ 3 02 1 a b ] | |
[ 3 20 1 a b ] | |
[ 3 2* a b ] | |
[ 321 0 a b] | |
[ 3 21 0 a b] | |
[ 3 120 a b] | |
[b 3 120 a ] | |
[b 3 2* a ] | |
[b 3 2* a ] | |
[b 32 * a ] | |
algorithm.iteration=254 | |
results['episode_reward_mean']=185626.016 | |
blue_agent_0_proximity_to_red_agent_0_mean=0.363 | |
blue_agent_0_proximity_to_red_agent_1_mean=0.341 | |
blue_agent_0_proximity_to_red_agent_2_mean=0.115 | |
blue_agent_0_proximity_to_red_agent_3_mean=0.189 | |
blue_agent_1_proximity_to_red_agent_0_mean=0.135 | |
blue_agent_1_proximity_to_red_agent_1_mean=0.270 | |
blue_agent_1_proximity_to_red_agent_2_mean=0.168 | |
blue_agent_1_proximity_to_red_agent_3_mean=0.439 | |
Sample game: | |
[ 3 a 0 1 b 2 ] | |
[ 3 a 0 1 b 2 ] | |
[ 3 a 0 1 b 2] | |
[2 3 a 0 1 b ] | |
[ 2 3 a 0 1 b ] | |
[2 3 a 0 1 b ] | |
[ 3 a 0 1 b 2] | |
[2 3 a 0 1 b ] | |
[ 2 3 a 0 1 b ] | |
[ 2 3 a 0 1 b ] | |
[ 2 3 a 0 1 b ] | |
[ 2 3 a 0 1 b ] | |
[ 2 3 a 0 1 b ] | |
[ 2 3 a 0 1 b] | |
[ 2 3 a 0 1 b] | |
[ 2 3 a0 1 b] | |
[ 2 3 * 1 b] | |
[b 2 3 0a 1 ] | |
[b 2 3 0 a 1 ] | |
[b 2 3 0 a 1 ] | |
[b 2 3 0 a 1 ] | |
[b 23 0 a 1 ] | |
[b 23 0 a 1 ] | |
[b 23 0 a 1 ] | |
[ b 23 0 a 1 ] | |
[ b 23 0 a 1 ] | |
[ b 23 0 a 1 ] | |
[ b 23 0 a 1 ] | |
[ b 23 0 a 1 ] | |
[ b 23 0 a 1 ] | |
[ b 32 0 a 1 ] | |
[ b 32 0 a 1 ] | |
[ b 23 0 a 1 ] | |
[ b 23 0 a 1 ] | |
[ b 2* a 1 ] | |
[ b 023 a 1 ] | |
[ b 023 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 023 a 1 ] | |
[ b 023 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 2 * a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 2* a 1 ] | |
[ b 023 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 2* a 1 ] | |
[ b 023 a 1 ] | |
[ b 023 a 1 ] | |
[ b 023 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 023 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 023 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 023 a 1 ] | |
[ b 023 a 1 ] | |
[ b 023 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 20 3 a 1 ] | |
[ b 02 3 a 1 ] | |
[ b 023 a 1] | |
[1 b 023 a ] | |
[ b 023 a 1] | |
[1 b 02 3 a ] | |
[ 1 b 02 3 a ] | |
[ 1 b 20 3 a ] | |
[ 1 b 02 3 a ] | |
[ 1 b 023 a ] | |
[ 1 b 02 3 a ] | |
[ 1 b 023 a ] | |
[ 1 b 023 a ] | |
[ 1 b 0 23 a ] | |
[ 1 b 02 3 a ] | |
[ 1 b 20 3 a ] | |
[ 1 b 20 3 a ] | |
[ 1 b 02 3 a ] | |
[ 1 b 20 3 a ] | |
[ 1 b 02 3 a ] | |
[ 1 b 023 a ] | |
[ 1 b 02 3 a ] | |
[ 1 b 023 a ] | |
[ 1 b 023 a ] | |
[ 1 b 0 23 a ] | |
[ 1 b 02 3 a ] | |
[ 1 b 023 a ] | |
[ 1 b 023 a] | |
[ 1 b 02 3 a] | |
[ 1 b 023 a] | |
[a 1 b 0 23 ] | |
[a 1 b 02 3 ] | |
[a 1 b 20 3 ] | |
[ a 1 b 02 3 ] | |
[ a 1 b 20 3 ] | |
[ a 1 b 2* ] | |
[ a 1 b 023 ] | |
[ a 1 b 023 ] | |
[ a 1 b 20 3 ] | |
[ a 1 b 023 ] | |
[ a 1 b 0 23 ] | |
[ a 1 b 02 3 ] | |
[ a 1 b 023 ] | |
[ a 1 b 023 ] | |
[ a 1 b 02 3 ] | |
[ a 1 b 02 3 ] | |
[ a 1 b 023 ] | |
[ a 1 b 02 3 ] | |
[ a 1 b 20 3 ] | |
[ a 1 b 20 3 ] | |
[ a 1 b 2 * ] | |
[ a 1 b 2 * ] | |
[ a 1 b 20 3 ] | |
[ a 1 b 2 0 3 ] | |
[ a 1 b 20 3 ] | |
[ a1 b 2 0 3 ] | |
[ * b 2 * ] | |
[ * b 23 0 ] | |
[ a1 b 2 3 0 ] | |
[ a 1 b 23 0 ] | |
[ * b 23 0 ] | |
[ a1 b 23 0 ] | |
[ a 1 b 23 0 ] | |
[ * b 32 0 ] | |
[ a1 b 32 0 ] | |
[ * b 32 0] | |
[ a1 b 3 2 0 ] | |
[ a1 b 3 2 0 ] | |
[ a 1 b 3 2 0 ] | |
[ a1 b 32 0 ] | |
[ 1a b 3 2 0 ] | |
[ 1 a b 32 0 ] | |
[ 1a b 320 ] | |
[ 1 a b 320 ] | |
[ 1 a b 3 02 ] | |
[ 1 a b *2 ] | |
[ 1 a b *2 ] | |
[ 1 a b *2 ] | |
[ 1 a b *2 ] | |
[ 1 a b 320 ] | |
[ 1 a b *2 ] | |
[ 1 a b 3 02 ] | |
[ 1 a b *2 ] | |
[ 1 a b *2 ] | |
[ 1 a b 320 ] | |
[ 1 a b *2 ] | |
[ 1 a b 023 ] | |
[ 1 a b 023 ] | |
[ 1 a b *2 ] | |
[ 1 a b *2 ] | |
[ 1 a b 3 02 ] | |
[ 1 a b *2 ] | |
[ 1a b *2 ] | |
[ * b 0 32 ] | |
[ a1 b 023 ] | |
[ a 1 b *2 ] | |
[ a 1 b 0 32 ] | |
[ a1 b *2 ] | |
[ * b *2 ] | |
[ a1 b *2 ] | |
[ 1a b *2 ] | |
[ * b *2 ] | |
[ 1a b *2 ] | |
[ 1 a b 0 32 ] | |
[ 1 a b *2 ] | |
[ 1 a b *2 ] | |
[ 1 a b *2 ] | |
[ 1 a b *2 ] | |
[ 1 a b 2* ] | |
[ 1 a b *2 ] | |
[ 1 a b 320 ] | |
[ 1 a b *2 ] | |
[ 1 a b *2] | |
[ 1 a b *2 ] | |
[ 1 a b 3 02] | |
[ 1 a b *2 ] | |
[ 1 a b *2] | |
[ 1 a b *2 ] | |
[ 1 a b 3 02] | |
[2 1 a b * ] | |
[ 1 a b *2] | |
[2 1 a b * ] | |
[ 1 a b *2] | |
[2 1 a b 3 0] | |
[ 2 1 a b * ] | |
[2 1 a b 3 0] | |
[ 1 a b *2] | |
[2 1 a b * ] | |
[ 1 a b 3 02] | |
[2 1 a b 3 0] | |
[ 1 a b 3 02] | |
[2 1 a b 3 0] | |
[ 1 a b 3 02] | |
[2 1 a b * ] | |
[ 1 a b 3 02] | |
[ 1 a b 3 02 ] | |
[ 1 a b 3 02] | |
[ 1 a b 3 02 ] | |
[ 1 a b 3 02 ] | |
[1 a b 3 02 ] | |
[ 1 a b 3 02] | |
[ 1 a b 3 02 ] | |
[ 1 a b 3 02 ] | |
[1 a b 3 02 ] | |
[ a b 3 02 1] | |
[1 a b 3 02 ] | |
[ a b 3 02 1] | |
[1 a b *2 ] | |
[ a b * 2 1] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1] | |
[1 a b 3 02 ] | |
[ a b *2 1] | |
[ a b 3 02 1 ] | |
[ a b * 2 1] | |
[ a b 3 02 1 ] | |
[ a b 3 02 1] | |
[ a b 3 02 1 ] | |
[ a b 3 201 ] | |
[ a b 3 201 ] | |
[ a b 3 2 01] | |
[ a b 3 2 10] | |
[ a b 3 2 01] | |
[ a b 3 2 10] | |
[ a b 3 2 01] | |
[ a b 3 2 01 ] | |
[ a b 3 201 ] | |
[ a b 3 2 01 ] | |
[ a b 3 2 01] | |
[ a b 3 2 01 ] | |
[ a b 3 20 1] | |
[ a b 3 201 ] | |
[ a b 3 2 01] | |
[ a b 3 201 ] | |
[ a b 3 2 01] | |
[1 a b 3 20 ] | |
[ a b 3 20 1] | |
[ a b 320 1 ] | |
[ a b 3 201 ] | |
[ a b 3 201 ] | |
[ a b 3 2 01] | |
[ a b 3 2 01 ] | |
[ a b 3 201 ] | |
[ a b 3 *0 ] | |
[ a b 3 *0 ] | |
[ a b 32 10 ] | |
[ a b 3 201 ] | |
[ a b 32 01 ] | |
[ a b 32 01] | |
[ a b 3 2 01 ] | |
[ a b 32 10 ] | |
[ a b 3 2 10 ] | |
[ a b 3 201 ] | |
[ a b 3 201 ] | |
[ a b 3 201] | |
[1 a b 3 20] | |
[0 a b 3 2 1] | |
[ a b 32 10] | |
[0 a b 23 1] | |
[ a b 32 10] | |
[0 a b 32 1] | |
[1 a b 320] | |
[0 a b 3*] | |
[10 a b 32 ] | |
[01 a b 23 ] | |
[10 a b 32 ] | |
[ 10 a b 32 ] | |
[10 a b 3 2 ] | |
[01 a b 32 ] | |
[10 a b 3 2 ] | |
[01 a b 3 2] | |
[201 a b 3 ] | |
[ 201 a b 3 ] | |
[ 201 a b 3] | |
[3 201 a b ] | |
[ 2 01 a b 3] | |
[ 2 10 a b 3 ] | |
[ 2 10 a b 3] | |
[3 2 10 a b ] | |
[ 32 01 a b ] | |
[ 23 01 a b ] | |
[ 23 01 a b ] | |
algorithm.iteration=255 | |
results['episode_reward_mean']=185519.67200000002 | |
blue_agent_0_proximity_to_red_agent_0_mean=0.365 | |
blue_agent_0_proximity_to_red_agent_1_mean=0.343 | |
blue_agent_0_proximity_to_red_agent_2_mean=0.115 | |
blue_agent_0_proximity_to_red_agent_3_mean=0.184 | |
blue_agent_1_proximity_to_red_agent_0_mean=0.134 | |
blue_agent_1_proximity_to_red_agent_1_mean=0.271 | |
blue_agent_1_proximity_to_red_agent_2_mean=0.161 | |
blue_agent_1_proximity_to_red_agent_3_mean=0.446 | |
Sample game: | |
[ *3 0 1 a ] | |
[ 2b 3 0 1 a ] | |
[ 2 b3 * a ] | |
[ 2* * a ] | |
[ 2 b3 * a ] | |
[ 2 b3 * a ] | |
[ 2 * * a ] | |
[ 2 3b * a ] | |
[ 2 3 b * a ] | |
[ 23 b * a ] | |
[ 32 b 0 1 a ] | |
[ 32b 0 1 a ] | |
[ 2* 0 1 a ] | |
[ 23b * a ] | |
[ 2* 1 0 a ] | |
[ b23 1 0 a ] | |
[ b 23 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b 23 1 0 a ] | |
[ b23 1 0 a ] | |
[ * 3 1 0 a ] | |
[ * 3 1 0 a ] | |
[ 2b 3 1 0 a ] | |
[2 b3 1 0 a ] | |
[ * 3 1 0 a ] | |
[ b23 1 0 a ] | |
[ b32 * a ] | |
[b 32 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b 23 1 0 a ] | |
[ b 23 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b 32 * a ] | |
[ b 3 2 0 1 a ] | |
[ b 32 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 20 1 a ] | |
[ * 20 1 a ] | |
[ b3 2 * a ] | |
[ b 3 2 * a ] | |
[ * 2 0 1 a ] | |
[ b3 2 0 1 a ] | |
[ * 2 * a ] | |
[ b3 2 0 1 a ] | |
[ b 3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b3 2 * a ] | |
[ * 2 0 1 a ] | |
[ 3b 2 * a ] | |
[ 3 b2 * a ] | |
[ 3* 1 0 a ] | |
[ 2* 1 0 a ] | |
[ 2b 3 * a ] | |
[ 2 b3 * a ] | |
[ 2* 1 0 a ] | |
[ b23 1 0 a ] | |
[ * 3 1 0 a ] | |
[ 2b 3 1 0 a ] | |
[ 2b 3 1 0 a ] | |
[ * 3 1 0 a ] | |
[ 2b 3 1 0 a ] | |
[ *3 1 0 a ] | |
[ * 3 1 0 a ] | |
[ b23 1 0 a ] | |
[ * 3 1 0 a ] | |
[ b 23 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b 23 1 0 a ] | |
[ b 23 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b3 2 1 0 a ] | |
[ b 3 2 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b 23 * a ] | |
[ b 23 1 0 a ] | |
[ b 23 1 0 a ] | |
[ b 23 1 0 a ] | |
[ b 32 1 0 a ] | |
[ b 23 * a ] | |
[ b 32 * a ] | |
[ b 32 * a ] | |
[ b 32 * a ] | |
[ b 32 0 1 a ] | |
[ b3 2 * a ] | |
[ * 2 0 1 a ] | |
[ 3b 2 0 1 a ] | |
[ 3 b 2 0 1 a ] | |
[ 3b 2 0 1 a ] | |
[ * 2 * a ] | |
[ 3b 2 0 1 a ] | |
[ * 2 0 1 a ] | |
[ b3 2 * a ] | |
[ 3b 2 0 1 a ] | |
[ * 2 * a ] | |
[ 3b 2 0 1 a ] | |
[ b3 2 0 1 a ] | |
[ b3 2 0 1 a ] | |
[ b 3 2 * a ] | |
[ b3 2 1 0 a ] | |
[ * 2 1 0 a ] | |
[ 3b 2 1 0 a ] | |
[ 3b 2 1 0 a ] | |
[ * 2 1 0 a ] | |
[ b3 2 1 0 a ] | |
[ * 2 1 0 a ] | |
[ * 2 1 0 a ] | |
[ 3b 2 1 0 a ] | |
[ 3 b 2 1 0 a ] | |
[ * 2 1 0 a ] | |
[ 3 b 2 1 0 a ] | |
[ 3 b 2 1 0 a ] | |
[ 3 b 2 * a ] | |
[ 3 b 2 * a ] | |
[ 3 b 20 1 a ] | |
[ 3 b 2* a ] | |
[ 3 b 120 a ] | |
[ 3 b 120 a ] | |
[ 3 b 120 a ] | |
[3 b 21 0 a ] | |
[ b 120 a 3] | |
[ b 21 0 a 3 ] | |
[ b 12 0 a 3 ] | |
[ b 1 2 0 a 3 ] | |
[ b 12 0 a 3 ] | |
[ b 1 2 0 a 3 ] | |
[ b 12 0 a 3 ] | |
[ b 12 0 a 3 ] | |
[ b 12 0 a 3 ] | |
[ b 21 0 a 3 ] | |
[ b 21 0 a 3 ] | |
[ b 21 0 a 3 ] | |
[ b 21 0 a 3 ] | |
[ b 12 0 a 3 ] | |
[ b 12 0 a 3 ] | |
[ b 1 20 a 3 ] | |
[ b 120 a 3 ] | |
[ b 1 20 a 3 ] | |
[ b 12 0 a 3 ] | |
[ b 12 0 a 3 ] | |
[ b 21 0 a 3 ] | |
[ b 12 0 a 3 ] | |
[ b 12 0 a 3] | |
[3 b 12 0 a ] | |
[ 3 b 21 0 a ] | |
[3 b 12 0 a ] | |
[ 3 b 12 0 a ] | |
[3 b 12 0 a ] | |
[ 3 b 12 0 a ] | |
[3 b 1 2 0 a ] | |
[ b 12 0 a 3] | |
[3 b 1 2 0 a ] | |
[ 3 b 12 0 a ] | |
[ 3 b 1 20 a ] | |
[ 3 b 12 0 a ] | |
[ 3 b 12 0 a ] | |
[ 3 b 12 0 a ] | |
[3 b 1 2 0 a ] | |
[ 3 b 1 2 0 a ] | |
[3 b 12 0 a ] | |
[ 3 b 12 0 a ] | |
[3 b 1 2 0 a ] | |
[ 3 b 12 0 a ] | |
[3 b 1 2 0 a ] | |
[ 3 b 12 0 a ] | |
[ 3 b 1 2 0 a ] | |
[ 3 b 12 0 a ] | |
[ 3 b 12 0 a ] | |
[ 3 b 12 0 a ] | |
[ 3 b 1 2 0 a ] | |
[ 3 b 1 2 0 a ] | |
[ 3 b 12 0 a ] | |
[ 3 b 12 0 a ] | |
[ 3 b 12 0 a ] | |
[ 3 b 12 0 a ] | |
[3 b 12 0 a ] | |
[ b 1 2 0 a 3] | |
[ b 12 0 a 3 ] | |
[ b 1 20 a 3 ] | |
[ b 12 0 a 3 ] | |
[ b 1 20 a 3 ] | |
[ b 120 a 3 ] | |
[ b 1 02 a 3 ] | |
[ b *2 a 3 ] | |
[ b *2 a 3] | |
[ b 1 02 a 3 ] | |
[ b *2 a 3] | |
[ b 1 02 a 3 ] | |
[ b 1 02 a 3] | |
[3 b 1 02 a ] | |
[ b 1 02 a 3] | |
[3 b 120 a ] | |
[ 3 b 1 02 a ] | |
[ 3 b 1 02 a ] | |
[ 3 b *2 a ] | |
[ 3 b *2 a ] | |
[ 3 b 1 02 a ] | |
[ 3 b *2 a ] | |
[ 3 b 1 02 a ] | |
[ 3 b *2 a ] | |
[ 3 b 1 02 a ] | |
[ 3 b 120 a ] | |
[ 3 b 1 02 a ] | |
[3 b 1 02 a ] | |
[ 3 b 1 02 a ] | |
[ 3 b 1 02 a ] | |
[ 3 b *2 a ] | |
[ 3 b 1 02 a ] | |
[ 3 b 120 a ] | |
[ 3 b 1 02 a ] | |
[ 3 b 1 02 a ] | |
[3 b *2 a ] | |
[ b 1 02 a3] | |
[ b *2 * ] | |
[ b 1 02 3a ] | |
[ b *2 3a ] | |
[ b 1 02 3 a ] | |
[ b 1 02 3 a ] | |
[ b *2 3 a ] | |
[ b 1 02 3 a ] | |
[ b 1 02 3 a ] | |
[ b * 2 3 a ] | |
[ b *2 3 a ] | |
[ b 1 02 3 a ] | |
[ b 1 02 3 a ] | |
[ b 1 02 3 a ] | |
[ b *2 3 a ] | |
[ b 1 02 3 a ] | |
[ b *2 3 a ] | |
[ b 1 02 3 a ] | |
[ b 120 3 a ] | |
[ b 12 * a ] | |
[ b 1 2* a ] | |
[ b 1 320 a ] | |
[ b 123 0 a ] | |
[ b 123 0 a ] | |
[ b *2 0 a ] | |
[ b 321 0 a ] | |
[ b 32* a ] | |
[ b 321 0 a ] | |
[ b 23 * a ] | |
[ b 2* 0 a ] | |
[ b 21 3 0 a ] | |
[ b 2* 0 a ] | |
[ b 2 * a ] | |
[ b 2 * a ] | |
[ b 2 * a ] | |
[ b 2 * a ] | |
[ b 2 * 1 a ] | |
[ b 23 * a ] | |
[ b 32 * a ] | |
[ b 32 0 1 a ] | |
[ b 23 * a ] | |
[ b 23 * a ] | |
[ b 23 0 1 a ] | |
[ b 23 * a ] | |
[ b 32 * a ] | |
[ b 3 2 * a ] | |
[ b 32 * a ] | |
[ b 23 * a ] | |
[ b 23 * a ] | |
[ b 23 0 1 a ] | |
[ b 32 0 1 a] | |
[ b 32 * a] | |
[ b 3 2 0 1 a] | |
[ b 3 2 * a] | |
[ b 3 2 0 1 a] | |
[a b 3 2 * ] | |
[a b 3 20 1 ] | |
[a b 3 2* ] | |
[ a b 3 2 * ] | |
[ a b 3 2 * ] | |
[ a b3 2 1 0 ] | |
[ a b3 2 * ] | |
[ a b 3 21 0 ] | |
[ a b3 21 0 ] | |
[ a b3 21 0 ] | |
[ a b 3 12 0 ] | |
[ a b3 12 0 ] | |
[ a b3 12 0 ] | |
[ a * 120 ] | |
[ a 3b 1 20 ] | |
[ a 3 b 120 ] | |
[ a 3 b 12 0 ] | |
[ a 3 b 120 ] | |
[ a 3 b 12 0 ] | |
[ a 3 b 120 ] | |
[ a 3 b 21 0 ] | |
[ a 3 b 12 0 ] | |
[ a 3 b 21 0 ] | |
[ a 3 b 12 0 ] | |
[ a 3 b 1 2 0 ] | |
[ a 3 b 12 0 ] | |
[ a 3 b 12 0 ] | |
[ a 3 b 1 2 0 ] | |
algorithm.iteration=256 | |
results['episode_reward_mean']=185692.82999999996 | |
blue_agent_0_proximity_to_red_agent_0_mean=0.368 | |
blue_agent_0_proximity_to_red_agent_1_mean=0.343 | |
blue_agent_0_proximity_to_red_agent_2_mean=0.114 | |
blue_agent_0_proximity_to_red_agent_3_mean=0.183 | |
blue_agent_1_proximity_to_red_agent_0_mean=0.130 | |
blue_agent_1_proximity_to_red_agent_1_mean=0.268 | |
blue_agent_1_proximity_to_red_agent_2_mean=0.155 | |
blue_agent_1_proximity_to_red_agent_3_mean=0.459 | |
Sample game: | |
[ 1 3 b a 0 2 ] | |
[ 1 3 b a 0 2] | |
[2 1 3 b a 0 ] | |
[ 2 1 3 b a 0 ] | |
[ 2 1 3 b a 0 ] | |
[ 2 1 3 b a 0 ] | |
[ 2 1 3 b a 0 ] | |
[ 2 1 3 b a 0 ] | |
[ 2 1 3 b a 0 ] | |
[ 2 1 3 b a 0 ] | |
[ 2 * b a 0 ] | |
[ 2 * b a 0 ] | |
[ 2 3 1 b a 0 ] | |
[ 2 3 1 b a 0 ] | |
[ 23 1 b a 0] | |
[0 23 1 b a ] | |
[ 0 32 1 b a ] | |
[ 0 23 1 b a ] | |
[ 0 32 1 b a ] | |
[ 0 23 1 b a ] | |
[ 0 23 1 b a ] | |
[ 0 23 1 b a ] | |
[ 0 23 1 b a ] | |
[ 0 23 1 b a ] | |
[ 0 23 1 b a ] | |
[ 0 32 1 b a ] | |
[ 0 23 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 2* 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 0 23 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 0 32 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ 023 1 b a ] | |
[ *2 1 b a] | |
[ 023 1 b a] | |
[ 023 1 b a] | |
[ 023 1 b a] | |
[ 023 1 b a] | |
[ 023 1 b a] | |
[ 023 1 b a] | |
[ 023 1 b a] | |
[ 023 1 b a] | |
[a 023 1 b ] | |
[ 023 1 b a] | |
[a *2 1 b ] | |
[a 023 1 b ] | |
[a 0 32 1 b ] | |
[a 023 1 b ] | |
[a 023 1 b ] | |
[a 023 1 b ] | |
[a 0 23 1 b ] | |
[ a 023 1 b ] | |
[ a 0 32 1 b ] | |
[ a 023 1 b ] | |
[a *2 1 b ] | |
[a 023 1 b ] | |
[a *2 1 b ] | |
[ 023 1 b a] | |
[a *2 1 b ] | |
[a 023 1 b ] | |
[a 023 1 b ] | |
[a 023 1 b ] | |
[a 023 1 b ] | |
[ a *2 1 b ] | |
[ a 023 1 b ] | |
[ a *2 1 b ] | |
[ a 023 1 b ] | |
[ a 023 1 b ] | |
[ a 0 32 1 b ] | |
[ a 023 1 b ] | |
[ a 023 1 b ] | |
[ a 023 1 b] | |
[ a 023 1 b ] | |
[ a 0 32 1 b] | |
[ a 023 1 b] | |
[ a 023 1 b] | |
[ a 023 1 b ] | |
[ a 0 32 1 b ] | |
[ a 023 1 b ] | |
[ a 023 1 b ] | |
[ a 023 1 b ] | |
[ a 023 1 b] | |
[ a 023 1 b] | |
[ a 023 1 b] | |
[ a 023 1 b ] | |
[ a 023 1 b] | |
[ a 023 1 b ] | |
[ a 023 1 b ] | |
[ a 023 1 b ] | |
[ a 023 1 b] | |
[ a 023 1 b ] | |
[ a 0 32 1 b] | |
[ a 023 1 b] | |
[ a 023 1 b] | |
[ a 023 1 b] | |
[ a 023 1 b] | |
[ a 023 1 b] | |
[ a 023 1 b] | |
[ a 023 1 b] | |
[b a 023 1 ] | |
[b a 0 32 1 ] | |
[b a 023 1 ] | |
[ a 023 1 b] | |
[b a 023 1 ] | |
[b a 023 1 ] | |
[b a 023 1 ] | |
[b a 023 1 ] | |
[b a 023 1 ] | |
[b a 023 1 ] | |
[b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 0 32 1 ] | |
[ b a 023 1 ] | |
[ b a *2 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 0 32 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a *2 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a *2 1 ] | |
[ b a 023 1 ] | |
[ b a *2 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 023 1 ] | |
[ b a 0 32 1 ] | |
[ b a 023 1 ] | |
[ b a *2 1 ] | |
[ b a 023 1 ] | |
algorithm.iteration=257 | |
results['episode_reward_mean']=186094.41999999995 | |
blue_agent_0_proximity_to_red_agent_0_mean=0.378 | |
blue_agent_0_proximity_to_red_agent_1_mean=0.341 | |
blue_agent_0_proximity_to_red_agent_2_mean=0.112 | |
blue_agent_0_proximity_to_red_agent_3_mean=0.181 | |
blue_agent_1_proximity_to_red_agent_0_mean=0.124 | |
blue_agent_1_proximity_to_red_agent_1_mean=0.271 | |
blue_agent_1_proximity_to_red_agent_2_mean=0.153 | |
blue_agent_1_proximity_to_red_agent_3_mean=0.469 | |
Sample game: | |
[ 2 a 3 0 b1 ] | |
[ 2 a 3 0 b1 ] | |
[ 2 a 3 0 * ] | |
[ 2 a 3 0 b1 ] | |
[ 2 a 3 0 * ] | |
[ 2 a 3 0 * ] | |
[ 2 a 3 0 1b ] | |
[ 2 a 3 0 1 b ] | |
[ 2 a 3 0 * ] | |
[ 2 a 3 0 1b ] | |
[ 2 a 3 0 1 b ] | |
[ 2 a 3 0 * ] | |
[ 2 a 3 0 b1 ] | |
[ 2 a 3 0 * ] | |
[ 2 a 3 0 1b ] | |
[ 2 a 3 0 1 b ] | |
[2 a 3 0 1 b ] | |
[ a 3 0 1 b 2] | |
[ a 3 0 1 b 2 ] | |
[ a3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a3 0 1 b 2 ] | |
[ * 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 * b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 * b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 * b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 * b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b 2 ] | |
[ a 3 0 1 b2 ] | |
[ a 3 0 1 b2 ] | |
[ a 3 * * ] | |
[ a * 1 2b ] | |
[ a * 1 2b ] | |
[ a 0 3 1 2 b ] | |
[ a 0 3 1 2 b ] | |
[ a 0 * 2 b ] | |
[ a 0 3 1 * ] | |
[ a 0 * 2b ] | |
[ a 0 3 1 2 b ] | |
[ a * 1 2 b ] | |
[ a 3 * 2b ] | |
[ a * 1 2 b ] | |
[ a * 1 * ] | |
[ a * 2b ] | |
[ a * 1 * ] | |
[ a 0 * 2b ] | |
[ a 0 3 1 2b ] | |
[ a 0 3 1 2 b ] | |
[ a 0 * 2 b ] | |
[ a 0 3 1 2 b ] | |
[ a 0 3 1 2 b ] | |
[ a 0 * 2 b ] | |
[ a 0 3 1 2 b ] | |
[ a 0 3 1 2 b ] | |
[ a 0 3 1 2 b ] | |
[a 0 3 1 2 b ] | |
[a * 1 2 b ] | |
[a 3 0 1 2 b ] | |
[ * 1 2 b a] | |
[ * 1 2 b a] | |
[ * 2 b a] | |
[ 3 * 2 b a ] | |
[ * 2 b a ] | |
[ * 1 2 b a ] | |
[ 3 * 2 b a ] | |
[ 3 * 2b a ] | |
[ * 1 2b a ] | |
[ 3 * 2 b a ] | |
[ * 1 2b a ] | |
[ * 1 b2 a ] | |
[ * 1 * a ] | |
[ 0 3 1 b2 a ] | |
[ 0 * b 2 a ] | |
[ 0 3 1 b 2 a ] | |
[ 0 * b2 a ] | |
[ 0 3 1 * a ] | |
[ 0 3 1 b 2 a ] | |
[ 0 3 1 b2 a ] | |
[ 0 * b 2 a ] | |
[ 0 3 1 b 2 a ] | |
[ 0 * b 2 a ] | |
[ 0 * b 2 a ] | |
[ 0 3 1 b 2 a ] | |
[ 0 * b2 a ] | |
[ 0 * b 2 a ] | |
[ 0 3 1 b 2 a ] | |
[ 0 3 1 b 2 a ] | |
[ 0 * b 2 a ] | |
[ 0 3 1 b2 a ] | |
[ 0 3 1 b2 a ] | |
[ 0 3 1 * a ] | |
[ 0 3 1 2b a ] | |
[ 0 * b2 a ] | |
[ 0 * * a ] | |
[ 0 * 2b a ] | |
[ 0 * 2 b a ] | |
[0 3 1 * a ] | |
[ 0 * 2b a ] | |
[ 0 * 2 b a ] | |
[ 0 * 2 b a ] | |
[ 0 3 1 2b a ] | |
[ 0 3 1 * a ] | |
[0 3 1 b 2 a ] | |
[ 3 1 b 2 a 0] | |
[0 3 1 b 2 a ] | |
[ 3 1 b2 a 0] | |
[0 3 1 b 2 a ] | |
[ 3 1 b 2 a 0] | |
[0 3 1 b 2 a ] | |
[ 3 1 b 2 a 0] | |
[ 3 1 b 2 a 0 ] | |
[ 3 1 b 2 a 0] | |
[0 3 1 b 2 a ] | |
[ 3 1 b 2 a 0] | |
[ 3 1 b 2 a 0 ] | |
[ 3 1 b 2 a 0] | |
[0 3 1 b 2 a ] | |
[ * b 2 a 0] | |
[0 * b 2 a ] | |
[ 0 * b 2 a ] | |
[0 3 1 b 2 a ] | |
[ 3 1 b 2 a 0] | |
[0 3 1 b 2 a ] | |
[ 3 1 b 2 a 0] | |
[ 3 1 b 2 a 0 ] | |
[ 3 1 b 2 a 0] | |
[ 3 1 b 2 a 0 ] | |
[ 3 1 b 2 a 0] | |
[0 * b 2 a ] | |
[ * b 2 a 0] | |
[0 3 1 b 2 a ] | |
[ * b 2 a 0] | |
[ * b 2 a 0 ] | |
[ 3 1 b 2 a 0] | |
[0 3 1 b 2 a ] | |
[ 0 3 1 b 2 a ] | |
[0 3 1 b 2 a ] | |
[ 3 1 b 2 a 0] | |
[0 3 1 b 2 a ] | |
[ 3 1 b 2 a 0] | |
[3 1 b 2 a 0 ] | |
[ 3 1 b 2 a 0] | |
[* 1 b 2 a ] | |
[ 0 1 b 2 a 3] | |
[* 1 b 2 a ] | |
[ 1 b 2 a *] | |
[ 1 b 2 a * ] | |
[ 1 b 2 a 3 0] | |
[0 1 b 2 a 3 ] | |
[ 1 b 2 a 3 0] | |
[0 1 b 2 a 3 ] | |
[ 0 1 b 2 a 3 ] | |
[ 0 1 b 2 a 3 ] | |
[ 0 1 b 2 a 3 ] | |
[ * b 2 a 3 ] | |
[ * b 2 a 3 ] | |
[ * b 2 a 3 ] | |
[ * b 2 a 3 ] | |
[ * b 2 a 3 ] | |
[ * b 2 a 3] | |
[ * b 2 a 3 ] | |
[ 0 1 b 2 a 3] | |
[* 1 b 2 a ] | |
[ 3 1 b 2 a 0] | |
[3 1 b 2 a 0 ] | |
[ 1 b 2 a *] | |
[3 1 b 2 a 0 ] | |
[ 1 b 2 a *] | |
[0 1 b 2 a 3 ] | |
[ * b 2 a 3 ] | |
[0 1 b 2 a 3 ] | |
[ * b 2 a 3 ] | |
[0 1 b 2 a 3 ] | |
[ * b 2 a 3 ] | |
[* b 2 a 3 ] | |
[ 0 b 2 a 3 1] | |
[0 b 2 a 3 1 ] | |
[ b 2 a 3 *] | |
[* b 2 a 3 ] | |
[ * b 2 a 3 ] | |
[* b 2 a 3 ] | |
[ b 2 a 3 *] | |
[1 b 2a 3 0 ] | |
[ b * 3 0 1] | |
[ b 2a 3 0 1 ] | |
[ b a2 3 * ] | |
[ b * 3 0 1 ] | |
[ b a2 3 0 1 ] | |
[ b a 2 3 0 1 ] | |
[ b a 2 3 0 1 ] | |
[ b a 2 3 0 1 ] | |
[ b a 2 3 0 1 ] | |
[ b a 2 3 0 1 ] | |
[ b a 2 3 0 1 ] | |
[ b a 2 3 0 1 ] | |
[ b a 2 3 0 1 ] | |
[ b a 23 0 1 ] | |
[ b a 320 1 ] | |
[ b a 3 02 1 ] | |
[ b a * 2 1 ] | |
[ b a 0 32 1 ] | |
[ b a 023 1 ] | |
[ b a 0 2* ] | |
[ b a 0 123 ] | |
[ b a 0 1 23 ] | |
[ b a 0 123 ] | |
[ b a 0 1 32 ] | |
[ b a 0 1 32 ] | |
[ b a 0 1 32 ] | |
[ b a0 *2 ] | |
[ b * 321 ] | |
[ b 0 a *2 ] | |
[ b 0 a *2 ] | |
[ b 0 a * 2 ] | |
[ b 0 a * 2 ] | |
[ b 0 a * 2 ] | |
[ b 0 a * 2 ] | |
[ b 0 a * 2 ] | |
[ b 0 a* 2 ] | |
[ b 0 * 2 ] | |
[ b 0 *a 2 ] | |
[ b 0 * a 2 ] | |
[ b 0 * a2 ] | |
[ b 0 * a 2 ] | |
[ b 0 * a 2 ] | |
[ b 0 * a2 ] | |
[ b 0 * * ] | |
[ b 0 * 2a ] | |
[ b 0 * 2 a ] | |
[ b 0 * 2 a ] | |
[ b 0 * 2 a ] | |
[ b 0 * 2 a ] | |
[ b 0 * 2 a ] | |
[ b 0 * 2 a ] | |
[ b 0 * 2 a ] | |
[ b * 2 a ] | |
[ b * 2 a ] | |
[ b * 0 2 a ] | |
[ b 3 1 0 2 a ] | |
[ b * 0 2 a ] | |
[ b 3 * 2 a ] | |
[ b 3 1 0 2 a ] | |
[ b 3 * 2 a ] | |
[ b 3 1 0 2 a ] | |
[ b 3 * 2 a ] | |
[ b 3 *2 a ] | |
[ b 3 2* a ] | |
[ b 3 20 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 2 * a ] | |
[ b 3 20 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 02 1 a ] | |
[ b *2 1 a ] | |
[ b 3 021 a ] | |
[ b 3 20 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 20 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 02 1 a ] | |
[ b 3 021 a ] | |
[ b 3 02 1 a ] | |
[ b * 21 a ] | |
[ b 3 021 a ] | |
[ b *2 1 a ] | |
[ b 3 021 a ] | |
[ b 3 02 1 a ] | |
[ b * 21 a ] | |
[ b 3 021 a ] | |
[ b 3 021 a ] | |
[ b 3 021 a ] | |
[ b *2 1 a ] | |
[ b 3 021 a ] | |
[ b *2 1 a ] | |
[ b * 21 a ] | |
[b 3 021 a ] | |
[b *2 1 a ] | |
[b * 21 a ] |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment