k: policy_iteration
aglo_results: {'Values': array([[-2.46275854, -2.76083815, -3.02708341, -3.18470615, -3.26295115,
-3.29789396, -3.30884987, -3.30567726, -3.31830887, -3.32485289],
[-1.2986248 , -2.08484303, -2.70245736, -3.03813227, -3.19690025,
-3.26660233, -3.28636816, -3.26581577, -3.30278955, -3.31802395],
[ 2.41759509, -0.09673608, -1.79185073, -2.63499651, -3.02416847,
-3.19059198, -3.23147986, -3.12756987, -3.26701566, -3.30686575],
[13.41316139, 5.09782531, 0.46290022, -1.70402077, -2.65885863,
-3.05780082, -3.210497 , -3.24596799, -3.29642296, -3.3155428 ],
[46.06376654, 18.01479973, 5.5578918 , 0.13229419, -2.02689072,
-2.84858819, -3.15254032, -3.26160562, -3.30443986, -3.31949198],
[ 0. , 43.28984743, 14.6652538 , 2.47234784, -1.4139694 ,
-2.6857767 , -3.11081207, -3.25503909, -3.30466731, -3.32055469],
[46.78475872, 17.72107474, 5.16077726, -0.08199397, -2.12226736,
-2.88874854, -3.17126198, -3.27422222, -3.31125225, -3.32339259],
[13.94655062, 5.41280061, 0.47378806, -1.78729709, -2.71857466,
-3.09305105, -3.24062394, -3.29780457, -3.31947287, -3.32685625],
[ 2.81928477, 0.22803461, -1.64398709, -2.60683311, -3.0337407 ,
-3.21118832, -3.28406823, -3.3135965 , -3.32528326, -3.32940849],
[-0.67919718, -1.63281145, -2.45812666, -2.93394332, -3.1618047 ,
-3.26065235, -3.3029011 , -3.32068652, -3.3279813 , -3.33063051]]), 'Policy': array([['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'N', 'N', 'N', 'S', 'N', 'N', 'N'],
['E', 'E', 'N', 'N', 'N', 'N', 'N', 'W', 'N', 'N'],
['E', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N']], dtype=object)}
algo_targets: {'Values': array([[-2.46275855, -2.76083816, -3.02708342, -3.18470617, -3.26295116,
-3.29789398, -3.30884988, -3.30567727, -3.31830888, -3.3248529 ],
[-1.29862481, -2.08484304, -2.70245737, -3.03813228, -3.19690026,
-3.26660234, -3.28636817, -3.26581578, -3.30278956, -3.31802396],
[ 2.41759508, -0.09673609, -1.79185074, -2.63499652, -3.02416848,
-3.19059199, -3.23147986, -3.12756987, -3.26701567, -3.30686576],
[13.41316138, 5.0978253 , 0.46290021, -1.70402078, -2.65885864,
-3.05780082, -3.21049701, -3.245968 , -3.29642297, -3.3155428 ],
[46.06376653, 18.01479973, 5.55789179, 0.13229418, -2.02689073,
-2.84858819, -3.15254032, -3.26160562, -3.30443986, -3.31949198],
[ 0. , 43.28984743, 14.66525379, 2.47234783, -1.4139694 ,
-2.6857767 , -3.11081207, -3.25503909, -3.30466731, -3.32055469],
[46.78475872, 17.72107474, 5.16077726, -0.08199397, -2.12226736,
-2.88874854, -3.17126198, -3.27422222, -3.31125226, -3.32339259],
[13.94655062, 5.41280061, 0.47378806, -1.78729709, -2.71857467,
-3.09305105, -3.24062394, -3.29780457, -3.31947287, -3.32685625],
[ 2.81928477, 0.22803461, -1.64398709, -2.60683311, -3.0337407 ,
-3.21118832, -3.28406823, -3.3135965 , -3.32528326, -3.32940849],
[-0.67919718, -1.63281145, -2.45812666, -2.93394332, -3.1618047 ,
-3.26065235, -3.3029011 , -3.32068652, -3.3279813 , -3.33063051]]), 'Policy': array([['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'N', 'N', 'N', 'S', 'N', 'N', 'N'],
['E', 'E', 'N', 'N', 'N', 'N', 'N', 'W', 'N', 'N'],
['E', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N']], dtype=object)}
k: value_iteration
aglo_results: {'Values': array([[-2.46275855, -2.76083815, -3.02708342, -3.18470616, -3.26295115,
-3.29789397, -3.30884988, -3.30567726, -3.31830888, -3.32485289],
[-1.29862481, -2.08484304, -2.70245737, -3.03813228, -3.19690026,
-3.26660234, -3.28636816, -3.26581577, -3.30278955, -3.31802395],
[ 2.41759508, -0.09673609, -1.79185074, -2.63499652, -3.02416848,
-3.19059199, -3.23147986, -3.12756987, -3.26701566, -3.30686575],
[13.41316138, 5.0978253 , 0.46290021, -1.70402078, -2.65885864,
-3.05780083, -3.21049701, -3.245968 , -3.29642297, -3.3155428 ],
[46.06376653, 18.01479973, 5.55789179, 0.13229418, -2.02689073,
-2.8485882 , -3.15254032, -3.26160562, -3.30443986, -3.31949198],
[ 0. , 43.28984742, 14.66525379, 2.47234783, -1.41396941,
-2.6857767 , -3.11081207, -3.25503909, -3.30466731, -3.32055469],
[46.78475871, 17.72107474, 5.16077725, -0.08199398, -2.12226737,
-2.88874855, -3.17126199, -3.27422222, -3.31125226, -3.32339259],
[13.94655061, 5.4128006 , 0.47378805, -1.7872971 , -2.71857467,
-3.09305106, -3.24062395, -3.29780457, -3.31947287, -3.32685625],
[ 2.81928476, 0.2280346 , -1.6439871 , -2.60683312, -3.03374071,
-3.21118833, -3.28406823, -3.31359651, -3.32528326, -3.3294085 ],
[-0.6791972 , -1.63281146, -2.45812667, -2.93394334, -3.16180472,
-3.26065236, -3.30290111, -3.32068653, -3.3279813 , -3.33063051]]), 'Policy': array([['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'N', 'N', 'N', 'S', 'N', 'N', 'N'],
['E', 'E', 'N', 'N', 'N', 'N', 'N', 'W', 'N', 'N'],
['E', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N']], dtype=object)}
algo_targets: {'Values': array([[-2.46275855, -2.76083815, -3.02708342, -3.18470616, -3.26295115,
-3.29789397, -3.30884988, -3.30567726, -3.31830888, -3.32485289],
[-1.29862481, -2.08484304, -2.70245737, -3.03813228, -3.19690026,
-3.26660234, -3.28636816, -3.26581577, -3.30278955, -3.31802395],
[ 2.41759508, -0.09673609, -1.79185074, -2.63499652, -3.02416848,
-3.19059199, -3.23147986, -3.12756987, -3.26701566, -3.30686575],
[13.41316138, 5.0978253 , 0.46290021, -1.70402078, -2.65885864,
-3.05780083, -3.21049701, -3.245968 , -3.29642297, -3.3155428 ],
[46.06376653, 18.01479973, 5.55789179, 0.13229418, -2.02689073,
-2.8485882 , -3.15254032, -3.26160562, -3.30443986, -3.31949198],
[ 0. , 43.28984742, 14.66525379, 2.47234783, -1.41396941,
-2.6857767 , -3.11081207, -3.25503909, -3.30466731, -3.32055469],
[46.78475871, 17.72107474, 5.16077725, -0.08199398, -2.12226737,
-2.88874855, -3.17126199, -3.27422222, -3.31125226, -3.32339259],
[13.94655061, 5.4128006 , 0.47378805, -1.7872971 , -2.71857467,
-3.09305106, -3.24062395, -3.29780457, -3.31947287, -3.32685625],
[ 2.81928476, 0.2280346 , -1.6439871 , -2.60683312, -3.03374071,
-3.21118833, -3.28406823, -3.31359651, -3.32528326, -3.3294085 ],
[-0.6791972 , -1.63281146, -2.45812667, -2.93394334, -3.16180472,
-3.26065236, -3.30290111, -3.32068653, -3.3279813 , -3.33063051]]), 'Policy': array([['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'N', 'N', 'N', 'S', 'N', 'N', 'N'],
['E', 'E', 'N', 'N', 'N', 'N', 'N', 'W', 'N', 'N'],
['E', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N']], dtype=object)}
k: td_lambda
aglo_results: {'Values': array([[1.17065175e-01, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00, 1.20869146e-02, 6.50801063e-03, 1.08455100e-01,
1.25939840e-01, 0.00000000e+00],
[0.00000000e+00, 0.00000000e+00, 9.30697487e-03, 6.74433462e-03,
2.87816477e-02, 3.12467594e-02, 1.03059572e-01, 1.52781881e-01,
1.58366091e-01, 0.00000000e+00],
[1.77384263e-03, 1.47800884e-02, 2.74846931e-02, 3.04573845e-02,
7.14399810e-02, 1.01562738e-01, 1.53524012e-01, 2.30581627e-01,
1.78870946e-01, 1.75414748e-01],
[6.40534487e-03, 2.82016679e-02, 3.19684901e-02, 5.26038043e-02,
7.84100241e-02, 1.72884035e-01, 1.99857466e-01, 3.47990968e-01,
5.79664376e-01, 2.56996466e-01],
[2.04541062e-02, 4.19457138e-02, 5.22520506e-02, 1.02433955e-01,
1.58553992e-01, 2.27612595e-01, 3.84148807e-01, 5.65629731e-01,
1.07566085e+00, 9.74159503e-01],
[2.39275526e-02, 6.98107944e-02, 8.44269638e-02, 1.09999353e-01,
2.47482489e-01, 4.01109042e-01, 5.24005132e-01, 9.62735996e-01,
1.61645974e+00, 1.43942491e+00],
[2.09996045e-02, 8.22097499e-02, 2.10721662e-01, 3.12594289e-01,
4.84813194e-01, 8.16088700e-01, 1.29269479e+00, 1.65792382e+00,
2.20209915e+00, 3.39107140e+00],
[0.00000000e+00, 5.22314165e-02, 2.41595651e-01, 4.22467516e-01,
6.25736022e-01, 7.12439438e-01, 2.08346370e+00, 3.28464640e+00,
3.79746486e+00, 5.89371046e+00],
[0.00000000e+00, 0.00000000e+00, 4.14289002e-02, 1.78576928e-01,
9.12966633e-01, 1.40156387e+00, 1.27983718e+00, 4.84976577e+00,
6.98025075e+00, 9.92256338e+00],
[0.00000000e+00, 0.00000000e+00, 6.74471744e-03, 1.92706213e-02,
3.49830663e-02, 5.96848511e-02, 8.28928265e-02, 1.05060024e-01,
1.00046447e+01, 0.00000000e+00]])}
algo_targets: {'Values': array([[1.17065175e-01, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00, 1.20869146e-02, 6.50801063e-03, 1.08455100e-01,
1.25939840e-01, 0.00000000e+00],
[0.00000000e+00, 0.00000000e+00, 9.30697487e-03, 6.74433462e-03,
2.87816477e-02, 3.12467594e-02, 1.03059572e-01, 1.52781881e-01,
1.58366091e-01, 0.00000000e+00],
[1.77384263e-03, 1.47800884e-02, 2.74846931e-02, 3.04573845e-02,
7.14399810e-02, 1.01562738e-01, 1.53524012e-01, 2.30581627e-01,
1.78870946e-01, 1.75414748e-01],
[6.40534487e-03, 2.82016679e-02, 3.19684901e-02, 5.26038043e-02,
7.84100241e-02, 1.72884035e-01, 1.99857466e-01, 3.47990968e-01,
5.79664376e-01, 2.56996466e-01],
[2.04541062e-02, 4.19457138e-02, 5.22520506e-02, 1.02433955e-01,
1.58553992e-01, 2.27612595e-01, 3.84148807e-01, 5.65629731e-01,
1.07566085e+00, 9.74159503e-01],
[2.39275526e-02, 6.98107944e-02, 8.44269638e-02, 1.09999353e-01,
2.47482489e-01, 4.01109042e-01, 5.24005132e-01, 9.62735996e-01,
1.61645974e+00, 1.43942491e+00],
[2.09996045e-02, 8.22097499e-02, 2.10721662e-01, 3.12594289e-01,
4.84813194e-01, 8.16088700e-01, 1.29269479e+00, 1.65792382e+00,
2.20209915e+00, 3.39107140e+00],
[0.00000000e+00, 5.22314165e-02, 2.41595651e-01, 4.22467516e-01,
6.25736022e-01, 7.12439438e-01, 2.08346370e+00, 3.28464640e+00,
3.79746486e+00, 5.89371046e+00],
[0.00000000e+00, 0.00000000e+00, 4.14289002e-02, 1.78576928e-01,
9.12966633e-01, 1.40156387e+00, 1.27983718e+00, 4.84976577e+00,
6.98025075e+00, 9.92256338e+00],
[0.00000000e+00, 0.00000000e+00, 6.74471744e-03, 1.92706213e-02,
3.49830663e-02, 5.96848511e-02, 8.28928265e-02, 1.05060024e-01,
1.00046447e+01, 0.00000000e+00]])}
k: policy_iteration
aglo_results: {'Values': array([[-2.46275854, -2.76083815, -3.02708341, -3.18470615, -3.26295115,
-3.29789396, -3.30884987, -3.30567726, -3.31830887, -3.32485289],
[-1.2986248 , -2.08484303, -2.70245736, -3.03813227, -3.19690025,
-3.26660233, -3.28636816, -3.26581577, -3.30278955, -3.31802395],
[ 2.41759509, -0.09673608, -1.79185073, -2.63499651, -3.02416847,
-3.19059198, -3.23147986, -3.12756987, -3.26701566, -3.30686575],
[13.41316139, 5.09782531, 0.46290022, -1.70402077, -2.65885863,
-3.05780082, -3.210497 , -3.24596799, -3.29642296, -3.3155428 ],
[46.06376654, 18.01479973, 5.5578918 , 0.13229419, -2.02689072,
-2.84858819, -3.15254032, -3.26160562, -3.30443986, -3.31949198],
[ 0. , 43.28984743, 14.6652538 , 2.47234784, -1.4139694 ,
-2.6857767 , -3.11081207, -3.25503909, -3.30466731, -3.32055469],
[46.78475872, 17.72107474, 5.16077726, -0.08199397, -2.12226736,
-2.88874854, -3.17126198, -3.27422222, -3.31125225, -3.32339259],
[13.94655062, 5.41280061, 0.47378806, -1.78729709, -2.71857466,
-3.09305105, -3.24062394, -3.29780457, -3.31947287, -3.32685625],
[ 2.81928477, 0.22803461, -1.64398709, -2.60683311, -3.0337407 ,
-3.21118832, -3.28406823, -3.3135965 , -3.32528326, -3.32940849],
[-0.67919718, -1.63281145, -2.45812666, -2.93394332, -3.1618047 ,
-3.26065235, -3.3029011 , -3.32068652, -3.3279813 , -3.33063051]]), 'Policy': array([['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'N', 'N', 'N', 'S', 'N', 'N', 'N'],
['E', 'E', 'N', 'N', 'N', 'N', 'N', 'W', 'N', 'N'],
['E', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N']], dtype=object)}
algo_targets: {'Values': array([[-2.46275855, -2.76083816, -3.02708342, -3.18470617, -3.26295116,
-3.29789398, -3.30884988, -3.30567727, -3.31830888, -3.3248529 ],
[-1.29862481, -2.08484304, -2.70245737, -3.03813228, -3.19690026,
-3.26660234, -3.28636817, -3.26581578, -3.30278956, -3.31802396],
[ 2.41759508, -0.09673609, -1.79185074, -2.63499652, -3.02416848,
-3.19059199, -3.23147986, -3.12756987, -3.26701567, -3.30686576],
[13.41316138, 5.0978253 , 0.46290021, -1.70402078, -2.65885864,
-3.05780082, -3.21049701, -3.245968 , -3.29642297, -3.3155428 ],
[46.06376653, 18.01479973, 5.55789179, 0.13229418, -2.02689073,
-2.84858819, -3.15254032, -3.26160562, -3.30443986, -3.31949198],
[ 0. , 43.28984743, 14.66525379, 2.47234783, -1.4139694 ,
-2.6857767 , -3.11081207, -3.25503909, -3.30466731, -3.32055469],
[46.78475872, 17.72107474, 5.16077726, -0.08199397, -2.12226736,
-2.88874854, -3.17126198, -3.27422222, -3.31125226, -3.32339259],
[13.94655062, 5.41280061, 0.47378806, -1.78729709, -2.71857467,
-3.09305105, -3.24062394, -3.29780457, -3.31947287, -3.32685625],
[ 2.81928477, 0.22803461, -1.64398709, -2.60683311, -3.0337407 ,
-3.21118832, -3.28406823, -3.3135965 , -3.32528326, -3.32940849],
[-0.67919718, -1.63281145, -2.45812666, -2.93394332, -3.1618047 ,
-3.26065235, -3.3029011 , -3.32068652, -3.3279813 , -3.33063051]]), 'Policy': array([['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'N', 'N', 'N', 'S', 'N', 'N', 'N'],
['E', 'E', 'N', 'N', 'N', 'N', 'N', 'W', 'N', 'N'],
['E', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N']], dtype=object)}
k: value_iteration
aglo_results: {'Values': array([[-2.46275855, -2.76083815, -3.02708342, -3.18470616, -3.26295115,
-3.29789397, -3.30884988, -3.30567726, -3.31830888, -3.32485289],
[-1.29862481, -2.08484304, -2.70245737, -3.03813228, -3.19690026,
-3.26660234, -3.28636816, -3.26581577, -3.30278955, -3.31802395],
[ 2.41759508, -0.09673609, -1.79185074, -2.63499652, -3.02416848,
-3.19059199, -3.23147986, -3.12756987, -3.26701566, -3.30686575],
[13.41316138, 5.0978253 , 0.46290021, -1.70402078, -2.65885864,
-3.05780083, -3.21049701, -3.245968 , -3.29642297, -3.3155428 ],
[46.06376653, 18.01479973, 5.55789179, 0.13229418, -2.02689073,
-2.8485882 , -3.15254032, -3.26160562, -3.30443986, -3.31949198],
[ 0. , 43.28984742, 14.66525379, 2.47234783, -1.41396941,
-2.6857767 , -3.11081207, -3.25503909, -3.30466731, -3.32055469],
[46.78475871, 17.72107474, 5.16077725, -0.08199398, -2.12226737,
-2.88874855, -3.17126199, -3.27422222, -3.31125226, -3.32339259],
[13.94655061, 5.4128006 , 0.47378805, -1.7872971 , -2.71857467,
-3.09305106, -3.24062395, -3.29780457, -3.31947287, -3.32685625],
[ 2.81928476, 0.2280346 , -1.6439871 , -2.60683312, -3.03374071,
-3.21118833, -3.28406823, -3.31359651, -3.32528326, -3.3294085 ],
[-0.6791972 , -1.63281146, -2.45812667, -2.93394334, -3.16180472,
-3.26065236, -3.30290111, -3.32068653, -3.3279813 , -3.33063051]]), 'Policy': array([['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'N', 'N', 'N', 'S', 'N', 'N', 'N'],
['E', 'E', 'N', 'N', 'N', 'N', 'N', 'W', 'N', 'N'],
['E', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N']], dtype=object)}
algo_targets: {'Values': array([[-2.46275855, -2.76083815, -3.02708342, -3.18470616, -3.26295115,
-3.29789397, -3.30884988, -3.30567726, -3.31830888, -3.32485289],
[-1.29862481, -2.08484304, -2.70245737, -3.03813228, -3.19690026,
-3.26660234, -3.28636816, -3.26581577, -3.30278955, -3.31802395],
[ 2.41759508, -0.09673609, -1.79185074, -2.63499652, -3.02416848,
-3.19059199, -3.23147986, -3.12756987, -3.26701566, -3.30686575],
[13.41316138, 5.0978253 , 0.46290021, -1.70402078, -2.65885864,
-3.05780083, -3.21049701, -3.245968 , -3.29642297, -3.3155428 ],
[46.06376653, 18.01479973, 5.55789179, 0.13229418, -2.02689073,
-2.8485882 , -3.15254032, -3.26160562, -3.30443986, -3.31949198],
[ 0. , 43.28984742, 14.66525379, 2.47234783, -1.41396941,
-2.6857767 , -3.11081207, -3.25503909, -3.30466731, -3.32055469],
[46.78475871, 17.72107474, 5.16077725, -0.08199398, -2.12226737,
-2.88874855, -3.17126199, -3.27422222, -3.31125226, -3.32339259],
[13.94655061, 5.4128006 , 0.47378805, -1.7872971 , -2.71857467,
-3.09305106, -3.24062395, -3.29780457, -3.31947287, -3.32685625],
[ 2.81928476, 0.2280346 , -1.6439871 , -2.60683312, -3.03374071,
-3.21118833, -3.28406823, -3.31359651, -3.32528326, -3.3294085 ],
[-0.6791972 , -1.63281146, -2.45812667, -2.93394334, -3.16180472,
-3.26065236, -3.30290111, -3.32068653, -3.3279813 , -3.33063051]]), 'Policy': array([['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'N', 'N', 'N', 'S', 'N', 'N', 'N'],
['E', 'E', 'N', 'N', 'N', 'N', 'N', 'W', 'N', 'N'],
['E', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N']], dtype=object)}
k: td_lambda
aglo_results: {'Values': array([[1.17065175e-01, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00, 1.20869146e-02, 6.50801063e-03, 1.08455100e-01,
1.25939840e-01, 0.00000000e+00],
[0.00000000e+00, 0.00000000e+00, 9.30697487e-03, 6.74433462e-03,
2.87816477e-02, 3.12467594e-02, 1.03059572e-01, 1.52781881e-01,
1.58366091e-01, 0.00000000e+00],
[1.77384263e-03, 1.47800884e-02, 2.74846931e-02, 3.04573845e-02,
7.14399810e-02, 1.01562738e-01, 1.53524012e-01, 2.30581627e-01,
1.78870946e-01, 1.75414748e-01],
[6.40534487e-03, 2.82016679e-02, 3.19684901e-02, 5.26038043e-02,
7.84100241e-02, 1.72884035e-01, 1.99857466e-01, 3.47990968e-01,
5.79664376e-01, 2.56996466e-01],
[2.04541062e-02, 4.19457138e-02, 5.22520506e-02, 1.02433955e-01,
1.58553992e-01, 2.27612595e-01, 3.84148807e-01, 5.65629731e-01,
1.07566085e+00, 9.74159503e-01],
[2.39275526e-02, 6.98107944e-02, 8.44269638e-02, 1.09999353e-01,
2.47482489e-01, 4.01109042e-01, 5.24005132e-01, 9.62735996e-01,
1.61645974e+00, 1.43942491e+00],
[2.09996045e-02, 8.22097499e-02, 2.10721662e-01, 3.12594289e-01,
4.84813194e-01, 8.16088700e-01, 1.29269479e+00, 1.65792382e+00,
2.20209915e+00, 3.39107140e+00],
[0.00000000e+00, 5.22314165e-02, 2.41595651e-01, 4.22467516e-01,
6.25736022e-01, 7.12439438e-01, 2.08346370e+00, 3.28464640e+00,
3.79746486e+00, 5.89371046e+00],
[0.00000000e+00, 0.00000000e+00, 4.14289002e-02, 1.78576928e-01,
9.12966633e-01, 1.40156387e+00, 1.27983718e+00, 4.84976577e+00,
6.98025075e+00, 9.92256338e+00],
[0.00000000e+00, 0.00000000e+00, 6.74471744e-03, 1.92706213e-02,
3.49830663e-02, 5.96848511e-02, 8.28928265e-02, 1.05060024e-01,
1.00046447e+01, 0.00000000e+00]])}
algo_targets: {'Values': array([[1.17065175e-01, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00, 1.20869146e-02, 6.50801063e-03, 1.08455100e-01,
1.25939840e-01, 0.00000000e+00],
[0.00000000e+00, 0.00000000e+00, 9.30697487e-03, 6.74433462e-03,
2.87816477e-02, 3.12467594e-02, 1.03059572e-01, 1.52781881e-01,
1.58366091e-01, 0.00000000e+00],
[1.77384263e-03, 1.47800884e-02, 2.74846931e-02, 3.04573845e-02,
7.14399810e-02, 1.01562738e-01, 1.53524012e-01, 2.30581627e-01,
1.78870946e-01, 1.75414748e-01],
[6.40534487e-03, 2.82016679e-02, 3.19684901e-02, 5.26038043e-02,
7.84100241e-02, 1.72884035e-01, 1.99857466e-01, 3.47990968e-01,
5.79664376e-01, 2.56996466e-01],
[2.04541062e-02, 4.19457138e-02, 5.22520506e-02, 1.02433955e-01,
1.58553992e-01, 2.27612595e-01, 3.84148807e-01, 5.65629731e-01,
1.07566085e+00, 9.74159503e-01],
[2.39275526e-02, 6.98107944e-02, 8.44269638e-02, 1.09999353e-01,
2.47482489e-01, 4.01109042e-01, 5.24005132e-01, 9.62735996e-01,
1.61645974e+00, 1.43942491e+00],
[2.09996045e-02, 8.22097499e-02, 2.10721662e-01, 3.12594289e-01,
4.84813194e-01, 8.16088700e-01, 1.29269479e+00, 1.65792382e+00,
2.20209915e+00, 3.39107140e+00],
[0.00000000e+00, 5.22314165e-02, 2.41595651e-01, 4.22467516e-01,
6.25736022e-01, 7.12439438e-01, 2.08346370e+00, 3.28464640e+00,
3.79746486e+00, 5.89371046e+00],
[0.00000000e+00, 0.00000000e+00, 4.14289002e-02, 1.78576928e-01,
9.12966633e-01, 1.40156387e+00, 1.27983718e+00, 4.84976577e+00,
6.98025075e+00, 9.92256338e+00],
[0.00000000e+00, 0.00000000e+00, 6.74471744e-03, 1.92706213e-02,
3.49830663e-02, 5.96848511e-02, 8.28928265e-02, 1.05060024e-01,
1.00046447e+01, 0.00000000e+00]])}
k: policy_iteration
aglo_results: {'Values': array([[-2.46275854, -2.76083815, -3.02708341, -3.18470615, -3.26295115,
-3.29789396, -3.30884987, -3.30567726, -3.31830887, -3.32485289],
[-1.2986248 , -2.08484303, -2.70245736, -3.03813227, -3.19690025,
-3.26660233, -3.28636816, -3.26581577, -3.30278955, -3.31802395],
[ 2.41759509, -0.09673608, -1.79185073, -2.63499651, -3.02416847,
-3.19059198, -3.23147986, -3.12756987, -3.26701566, -3.30686575],
[13.41316139, 5.09782531, 0.46290022, -1.70402077, -2.65885863,
-3.05780082, -3.210497 , -3.24596799, -3.29642296, -3.3155428 ],
[46.06376654, 18.01479973, 5.5578918 , 0.13229419, -2.02689072,
-2.84858819, -3.15254032, -3.26160562, -3.30443986, -3.31949198],
[ 0. , 43.28984743, 14.6652538 , 2.47234784, -1.4139694 ,
-2.6857767 , -3.11081207, -3.25503909, -3.30466731, -3.32055469],
[46.78475872, 17.72107474, 5.16077726, -0.08199397, -2.12226736,
-2.88874854, -3.17126198, -3.27422222, -3.31125225, -3.32339259],
[13.94655062, 5.41280061, 0.47378806, -1.78729709, -2.71857466,
-3.09305105, -3.24062394, -3.29780457, -3.31947287, -3.32685625],
[ 2.81928477, 0.22803461, -1.64398709, -2.60683311, -3.0337407 ,
-3.21118832, -3.28406823, -3.3135965 , -3.32528326, -3.32940849],
[-0.67919718, -1.63281145, -2.45812666, -2.93394332, -3.1618047 ,
-3.26065235, -3.3029011 , -3.32068652, -3.3279813 , -3.33063051]]), 'Policy': array([['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'N', 'N', 'N', 'S', 'N', 'N', 'N'],
['E', 'E', 'N', 'N', 'N', 'N', 'N', 'W', 'N', 'N'],
['E', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N']], dtype=object)}
algo_targets: {'Values': array([[-2.46275855, -2.76083816, -3.02708342, -3.18470617, -3.26295116,
-3.29789398, -3.30884988, -3.30567727, -3.31830888, -3.3248529 ],
[-1.29862481, -2.08484304, -2.70245737, -3.03813228, -3.19690026,
-3.26660234, -3.28636817, -3.26581578, -3.30278956, -3.31802396],
[ 2.41759508, -0.09673609, -1.79185074, -2.63499652, -3.02416848,
-3.19059199, -3.23147986, -3.12756987, -3.26701567, -3.30686576],
[13.41316138, 5.0978253 , 0.46290021, -1.70402078, -2.65885864,
-3.05780082, -3.21049701, -3.245968 , -3.29642297, -3.3155428 ],
[46.06376653, 18.01479973, 5.55789179, 0.13229418, -2.02689073,
-2.84858819, -3.15254032, -3.26160562, -3.30443986, -3.31949198],
[ 0. , 43.28984743, 14.66525379, 2.47234783, -1.4139694 ,
-2.6857767 , -3.11081207, -3.25503909, -3.30466731, -3.32055469],
[46.78475872, 17.72107474, 5.16077726, -0.08199397, -2.12226736,
-2.88874854, -3.17126198, -3.27422222, -3.31125226, -3.32339259],
[13.94655062, 5.41280061, 0.47378806, -1.78729709, -2.71857467,
-3.09305105, -3.24062394, -3.29780457, -3.31947287, -3.32685625],
[ 2.81928477, 0.22803461, -1.64398709, -2.60683311, -3.0337407 ,
-3.21118832, -3.28406823, -3.3135965 , -3.32528326, -3.32940849],
[-0.67919718, -1.63281145, -2.45812666, -2.93394332, -3.1618047 ,
-3.26065235, -3.3029011 , -3.32068652, -3.3279813 , -3.33063051]]), 'Policy': array([['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'N', 'N', 'N', 'S', 'N', 'N', 'N'],
['E', 'E', 'N', 'N', 'N', 'N', 'N', 'W', 'N', 'N'],
['E', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N']], dtype=object)}
k: value_iteration
aglo_results: {'Values': array([[-2.46275855, -2.76083815, -3.02708342, -3.18470616, -3.26295115,
-3.29789397, -3.30884988, -3.30567726, -3.31830888, -3.32485289],
[-1.29862481, -2.08484304, -2.70245737, -3.03813228, -3.19690026,
-3.26660234, -3.28636816, -3.26581577, -3.30278955, -3.31802395],
[ 2.41759508, -0.09673609, -1.79185074, -2.63499652, -3.02416848,
-3.19059199, -3.23147986, -3.12756987, -3.26701566, -3.30686575],
[13.41316138, 5.0978253 , 0.46290021, -1.70402078, -2.65885864,
-3.05780083, -3.21049701, -3.245968 , -3.29642297, -3.3155428 ],
[46.06376653, 18.01479973, 5.55789179, 0.13229418, -2.02689073,
-2.8485882 , -3.15254032, -3.26160562, -3.30443986, -3.31949198],
[ 0. , 43.28984742, 14.66525379, 2.47234783, -1.41396941,
-2.6857767 , -3.11081207, -3.25503909, -3.30466731, -3.32055469],
[46.78475871, 17.72107474, 5.16077725, -0.08199398, -2.12226737,
-2.88874855, -3.17126199, -3.27422222, -3.31125226, -3.32339259],
[13.94655061, 5.4128006 , 0.47378805, -1.7872971 , -2.71857467,
-3.09305106, -3.24062395, -3.29780457, -3.31947287, -3.32685625],
[ 2.81928476, 0.2280346 , -1.6439871 , -2.60683312, -3.03374071,
-3.21118833, -3.28406823, -3.31359651, -3.32528326, -3.3294085 ],
[-0.6791972 , -1.63281146, -2.45812667, -2.93394334, -3.16180472,
-3.26065236, -3.30290111, -3.32068653, -3.3279813 , -3.33063051]]), 'Policy': array([['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'N', 'N', 'N', 'S', 'N', 'N', 'N'],
['E', 'E', 'N', 'N', 'N', 'N', 'N', 'W', 'N', 'N'],
['E', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N']], dtype=object)}
algo_targets: {'Values': array([[-2.46275855, -2.76083815, -3.02708342, -3.18470616, -3.26295115,
-3.29789397, -3.30884988, -3.30567726, -3.31830888, -3.32485289],
[-1.29862481, -2.08484304, -2.70245737, -3.03813228, -3.19690026,
-3.26660234, -3.28636816, -3.26581577, -3.30278955, -3.31802395],
[ 2.41759508, -0.09673609, -1.79185074, -2.63499652, -3.02416848,
-3.19059199, -3.23147986, -3.12756987, -3.26701566, -3.30686575],
[13.41316138, 5.0978253 , 0.46290021, -1.70402078, -2.65885864,
-3.05780083, -3.21049701, -3.245968 , -3.29642297, -3.3155428 ],
[46.06376653, 18.01479973, 5.55789179, 0.13229418, -2.02689073,
-2.8485882 , -3.15254032, -3.26160562, -3.30443986, -3.31949198],
[ 0. , 43.28984742, 14.66525379, 2.47234783, -1.41396941,
-2.6857767 , -3.11081207, -3.25503909, -3.30466731, -3.32055469],
[46.78475871, 17.72107474, 5.16077725, -0.08199398, -2.12226737,
-2.88874855, -3.17126199, -3.27422222, -3.31125226, -3.32339259],
[13.94655061, 5.4128006 , 0.47378805, -1.7872971 , -2.71857467,
-3.09305106, -3.24062395, -3.29780457, -3.31947287, -3.32685625],
[ 2.81928476, 0.2280346 , -1.6439871 , -2.60683312, -3.03374071,
-3.21118833, -3.28406823, -3.31359651, -3.32528326, -3.3294085 ],
[-0.6791972 , -1.63281146, -2.45812667, -2.93394334, -3.16180472,
-3.26065236, -3.30290111, -3.32068653, -3.3279813 , -3.33063051]]), 'Policy': array([['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'N', 'N', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'N', 'N', 'N', 'S', 'N', 'N', 'N'],
['E', 'E', 'N', 'N', 'N', 'N', 'N', 'W', 'N', 'N'],
['E', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N'],
['W', 'W', 'W', 'W', 'N', 'N', 'N', 'N', 'N', 'N']], dtype=object)}
k: td_lambda
aglo_results: {'Values': array([[1.17065175e-01, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00, 1.20869146e-02, 6.50801063e-03, 1.08455100e-01,
1.25939840e-01, 0.00000000e+00],
[0.00000000e+00, 0.00000000e+00, 9.30697487e-03, 6.74433462e-03,
2.87816477e-02, 3.12467594e-02, 1.03059572e-01, 1.52781881e-01,
1.58366091e-01, 0.00000000e+00],
[1.77384263e-03, 1.47800884e-02, 2.74846931e-02, 3.04573845e-02,
7.14399810e-02, 1.01562738e-01, 1.53524012e-01, 2.30581627e-01,
1.78870946e-01, 1.75414748e-01],
[6.40534487e-03, 2.82016679e-02, 3.19684901e-02, 5.26038043e-02,
7.84100241e-02, 1.72884035e-01, 1.99857466e-01, 3.47990968e-01,
5.79664376e-01, 2.56996466e-01],
[2.04541062e-02, 4.19457138e-02, 5.22520506e-02, 1.02433955e-01,
1.58553992e-01, 2.27612595e-01, 3.84148807e-01, 5.65629731e-01,
1.07566085e+00, 9.74159503e-01],
[2.39275526e-02, 6.98107944e-02, 8.44269638e-02, 1.09999353e-01,
2.47482489e-01, 4.01109042e-01, 5.24005132e-01, 9.62735996e-01,
1.61645974e+00, 1.43942491e+00],
[2.09996045e-02, 8.22097499e-02, 2.10721662e-01, 3.12594289e-01,
4.84813194e-01, 8.16088700e-01, 1.29269479e+00, 1.65792382e+00,
2.20209915e+00, 3.39107140e+00],
[0.00000000e+00, 5.22314165e-02, 2.41595651e-01, 4.22467516e-01,
6.25736022e-01, 7.12439438e-01, 2.08346370e+00, 3.28464640e+00,
3.79746486e+00, 5.89371046e+00],
[0.00000000e+00, 0.00000000e+00, 4.14289002e-02, 1.78576928e-01,
9.12966633e-01, 1.40156387e+00, 1.27983718e+00, 4.84976577e+00,
6.98025075e+00, 9.92256338e+00],
[0.00000000e+00, 0.00000000e+00, 6.74471744e-03, 1.92706213e-02,
3.49830663e-02, 5.96848511e-02, 8.28928265e-02, 1.05060024e-01,
1.00046447e+01, 0.00000000e+00]])}
algo_targets: {'Values': array([[1.17065175e-01, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00, 1.20869146e-02, 6.50801063e-03, 1.08455100e-01,
1.25939840e-01, 0.00000000e+00],
[0.00000000e+00, 0.00000000e+00, 9.30697487e-03, 6.74433462e-03,
2.87816477e-02, 3.12467594e-02, 1.03059572e-01, 1.52781881e-01,
1.58366091e-01, 0.00000000e+00],
[1.77384263e-03, 1.47800884e-02, 2.74846931e-02, 3.04573845e-02,
7.14399810e-02, 1.01562738e-01, 1.53524012e-01, 2.30581627e-01,
1.78870946e-01, 1.75414748e-01],
[6.40534487e-03, 2.82016679e-02, 3.19684901e-02, 5.26038043e-02,
7.84100241e-02, 1.72884035e-01, 1.99857466e-01, 3.47990968e-01,
5.79664376e-01, 2.56996466e-01],
[2.04541062e-02, 4.19457138e-02, 5.22520506e-02, 1.02433955e-01,
1.58553992e-01, 2.27612595e-01, 3.84148807e-01, 5.65629731e-01,
1.07566085e+00, 9.74159503e-01],
[2.39275526e-02, 6.98107944e-02, 8.44269638e-02, 1.09999353e-01,
2.47482489e-01, 4.01109042e-01, 5.24005132e-01, 9.62735996e-01,
1.61645974e+00, 1.43942491e+00],
[2.09996045e-02, 8.22097499e-02, 2.10721662e-01, 3.12594289e-01,
4.84813194e-01, 8.16088700e-01, 1.29269479e+00, 1.65792382e+00,
2.20209915e+00, 3.39107140e+00],
[0.00000000e+00, 5.22314165e-02, 2.41595651e-01, 4.22467516e-01,
6.25736022e-01, 7.12439438e-01, 2.08346370e+00, 3.28464640e+00,
3.79746486e+00, 5.89371046e+00],
[0.00000000e+00, 0.00000000e+00, 4.14289002e-02, 1.78576928e-01,
9.12966633e-01, 1.40156387e+00, 1.27983718e+00, 4.84976577e+00,
6.98025075e+00, 9.92256338e+00],
[0.00000000e+00, 0.00000000e+00, 6.74471744e-03, 1.92706213e-02,
3.49830663e-02, 5.96848511e-02, 8.28928265e-02, 1.05060024e-01,
1.00046447e+01, 0.00000000e+00]])}
k: policy_iteration
aglo_results: {'Values': array([[0.06990123, 0.04381939, 0.02781757, 0.02150566, 0.03177758,
0.04843078, 0.0738093 , 0.11235013, 0.16722416, 0.2225751 ],
[0.04381812, 0.02853524, 0.02093494, 0.03018145, 0.04649546,
0.07188254, 0.11118625, 0.1711766 , 0.2567688 , 0.34642434],
[0.02779155, 0.02088371, 0.03007567, 0.04635918, 0.0717817 ,
0.11117895, 0.17214118, 0.26564707, 0.40144695, 0.54980087],
[0.02104052, 0.03009213, 0.04634983, 0.07177349, 0.11117723,
0.17221672, 0.26672727, 0.41230604, 0.62751816, 0.87364793],
[0.03099534, 0.04637978, 0.07176096, 0.11116745, 0.17221352,
0.26677289, 0.41324336, 0.63960307, 0.97995139, 1.38917167],
[0.04714752, 0.07163348, 0.11099575, 0.17206307, 0.26667019,
0.41321143, 0.64017598, 0.99168994, 1.52855546, 2.21043278],
[0.07171064, 0.10952695, 0.17032907, 0.26486022, 0.41154751,
0.63897585, 0.99132254, 1.53684702, 2.38105715, 3.51985474],
[0.10347498, 0.15971313, 0.2510634 , 0.39461385, 0.61963447,
0.97171027, 1.52130989, 2.37673783, 3.70311633, 5.6095095 ],
[0.12557793, 0.19666142, 0.31452166, 0.5044737 , 0.81119701,
1.30803385, 2.11561091, 3.4345435 , 5.7487657 , 8.94760788],
[0.10196562, 0.15462236, 0.23834058, 0.36665112, 0.5622787 ,
0.85905854, 1.29065379, 0.11982362, 8.67888199, 0. ]]), 'Policy': array([['N', 'W', 'W', 'E', 'E', 'E', 'E', 'N', 'N', 'N'],
['S', 'S', 'E', 'E', 'E', 'E', 'N', 'N', 'N', 'N'],
['S', 'N', 'E', 'E', 'E', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'E', 'E', 'E', 'N', 'N', 'N', 'N', 'N'],
['N', 'E', 'E', 'E', 'E', 'E', 'N', 'N', 'N', 'N'],
['N', 'E', 'E', 'E', 'E', 'E', 'E', 'N', 'N', 'N'],
['E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'E', 'S', 'S', 'N', 'E', 'N']], dtype=object)}
algo_targets: {'Values': array([[0.06990123, 0.04381939, 0.02781757, 0.02150566, 0.03177758,
0.04843078, 0.0738093 , 0.11235013, 0.16722416, 0.2225751 ],
[0.04381811, 0.02853524, 0.02093493, 0.03018144, 0.04649546,
0.07188254, 0.11118625, 0.1711766 , 0.2567688 , 0.34642434],
[0.02779154, 0.0208837 , 0.03007567, 0.04635918, 0.0717817 ,
0.11117895, 0.17214118, 0.26564707, 0.40144695, 0.54980087],
[0.02104052, 0.03009213, 0.04634982, 0.07177348, 0.11117723,
0.17221672, 0.26672727, 0.41230604, 0.62751816, 0.87364793],
[0.03099534, 0.04637978, 0.07176096, 0.11116745, 0.17221352,
0.26677289, 0.41324336, 0.63960307, 0.97995139, 1.38917167],
[0.04714752, 0.07163348, 0.11099575, 0.17206307, 0.26667019,
0.41321143, 0.64017598, 0.99168994, 1.52855546, 2.21043278],
[0.07171064, 0.10952695, 0.17032907, 0.26486022, 0.41154751,
0.63897585, 0.99132254, 1.53684702, 2.38105715, 3.51985474],
[0.10347498, 0.15971313, 0.2510634 , 0.39461385, 0.61963447,
0.97171027, 1.52130989, 2.37673783, 3.70311633, 5.6095095 ],
[0.12557793, 0.19666142, 0.31452166, 0.5044737 , 0.81119701,
1.30803385, 2.11561091, 3.4345435 , 5.7487657 , 8.94760788],
[0.10196562, 0.15462236, 0.23834058, 0.36665112, 0.5622787 ,
0.85905854, 1.29065379, 0.11982362, 8.67888199, 0. ]]), 'Policy': array([['N', 'W', 'W', 'E', 'E', 'E', 'E', 'N', 'N', 'N'],
['S', 'S', 'E', 'E', 'E', 'E', 'N', 'N', 'N', 'N'],
['S', 'N', 'E', 'E', 'E', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'E', 'E', 'E', 'N', 'N', 'N', 'N', 'N'],
['N', 'E', 'E', 'E', 'E', 'E', 'N', 'N', 'N', 'N'],
['N', 'E', 'E', 'E', 'E', 'E', 'E', 'N', 'N', 'N'],
['E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'E', 'S', 'S', 'N', 'E', 'N']], dtype=object)}
k: value_iteration
aglo_results: {'Values': array([[0.06990123, 0.04381939, 0.02781757, 0.02150566, 0.03177757,
0.04843078, 0.0738093 , 0.11235013, 0.16722416, 0.2225751 ],
[0.04381811, 0.02853524, 0.02093493, 0.03018144, 0.04649545,
0.07188254, 0.11118625, 0.1711766 , 0.2567688 , 0.34642434],
[0.02779154, 0.0208837 , 0.03007566, 0.04635918, 0.07178169,
0.11117895, 0.17214117, 0.26564707, 0.40144695, 0.54980087],
[0.02104051, 0.03009213, 0.04634982, 0.07177348, 0.11117723,
0.17221671, 0.26672727, 0.41230604, 0.62751816, 0.87364793],
[0.03099534, 0.04637978, 0.07176095, 0.11116745, 0.17221351,
0.26677289, 0.41324336, 0.63960307, 0.97995139, 1.38917167],
[0.04714752, 0.07163348, 0.11099575, 0.17206307, 0.26667019,
0.41321143, 0.64017598, 0.99168994, 1.52855546, 2.21043278],
[0.07171064, 0.10952695, 0.17032907, 0.26486022, 0.41154751,
0.63897585, 0.99132254, 1.53684702, 2.38105715, 3.51985474],
[0.10347498, 0.15971313, 0.2510634 , 0.39461385, 0.61963447,
0.97171027, 1.52130989, 2.37673783, 3.70311633, 5.6095095 ],
[0.12557792, 0.19666142, 0.31452166, 0.5044737 , 0.81119701,
1.30803385, 2.11561091, 3.4345435 , 5.7487657 , 8.94760788],
[0.10196561, 0.15462236, 0.23834058, 0.36665112, 0.5622787 ,
0.85905854, 1.29065379, 0.11982362, 8.67888199, 0. ]]), 'Policy': array([['N', 'W', 'W', 'E', 'E', 'E', 'E', 'N', 'N', 'N'],
['S', 'S', 'E', 'E', 'E', 'E', 'N', 'N', 'N', 'N'],
['S', 'N', 'E', 'E', 'E', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'E', 'E', 'E', 'N', 'N', 'N', 'N', 'N'],
['N', 'E', 'E', 'E', 'E', 'E', 'N', 'N', 'N', 'N'],
['N', 'E', 'E', 'E', 'E', 'E', 'E', 'N', 'N', 'N'],
['E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'E', 'S', 'S', 'N', 'E', 'N']], dtype=object)}
algo_targets: {'Values': array([[0.06990123, 0.04381939, 0.02781757, 0.02150566, 0.03177757,
0.04843078, 0.0738093 , 0.11235013, 0.16722416, 0.2225751 ],
[0.04381811, 0.02853524, 0.02093493, 0.03018144, 0.04649545,
0.07188254, 0.11118625, 0.1711766 , 0.2567688 , 0.34642434],
[0.02779154, 0.0208837 , 0.03007566, 0.04635918, 0.07178169,
0.11117895, 0.17214117, 0.26564707, 0.40144695, 0.54980087],
[0.02104051, 0.03009213, 0.04634982, 0.07177348, 0.11117723,
0.17221671, 0.26672727, 0.41230604, 0.62751816, 0.87364793],
[0.03099534, 0.04637978, 0.07176095, 0.11116745, 0.17221351,
0.26677289, 0.41324336, 0.63960307, 0.97995139, 1.38917167],
[0.04714752, 0.07163348, 0.11099575, 0.17206307, 0.26667019,
0.41321143, 0.64017598, 0.99168994, 1.52855546, 2.21043278],
[0.07171064, 0.10952695, 0.17032907, 0.26486022, 0.41154751,
0.63897585, 0.99132254, 1.53684702, 2.38105715, 3.51985474],
[0.10347498, 0.15971313, 0.2510634 , 0.39461385, 0.61963447,
0.97171027, 1.52130989, 2.37673783, 3.70311633, 5.6095095 ],
[0.12557792, 0.19666142, 0.31452166, 0.5044737 , 0.81119701,
1.30803385, 2.11561091, 3.4345435 , 5.7487657 , 8.94760788],
[0.10196561, 0.15462236, 0.23834058, 0.36665112, 0.5622787 ,
0.85905854, 1.29065379, 0.11982362, 8.67888199, 0. ]]), 'Policy': array([['N', 'W', 'W', 'E', 'E', 'E', 'E', 'N', 'N', 'N'],
['S', 'S', 'E', 'E', 'E', 'E', 'N', 'N', 'N', 'N'],
['S', 'N', 'E', 'E', 'E', 'N', 'N', 'N', 'N', 'N'],
['N', 'N', 'E', 'E', 'E', 'N', 'N', 'N', 'N', 'N'],
['N', 'E', 'E', 'E', 'E', 'E', 'N', 'N', 'N', 'N'],
['N', 'E', 'E', 'E', 'E', 'E', 'E', 'N', 'N', 'N'],
['E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'N', 'N'],
['E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'E', 'N'],
['E', 'E', 'E', 'E', 'E', 'S', 'S', 'N', 'E', 'N']], dtype=object)}
k: td_lambda
aglo_results: {'Values': array([[1.17065175e-01, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00, 1.20869146e-02, 6.50801063e-03, 1.08455100e-01,
1.25939840e-01, 0.00000000e+00],
[0.00000000e+00, 0.00000000e+00, 9.30697487e-03, 6.74433462e-03,
2.87816477e-02, 3.12467594e-02, 1.03059572e-01, 1.52781881e-01,
1.58366091e-01, 0.00000000e+00],
[1.77384263e-03, 1.47800884e-02, 2.74846931e-02, 3.04573845e-02,
7.14399810e-02, 1.01562738e-01, 1.53524012e-01, 2.30581627e-01,
1.78870946e-01, 1.75414748e-01],
[6.40534487e-03, 2.82016679e-02, 3.19684901e-02, 5.26038043e-02,
7.84100241e-02, 1.72884035e-01, 1.99857466e-01, 3.47990968e-01,
5.79664376e-01, 2.56996466e-01],
[2.04541062e-02, 4.19457138e-02, 5.22520506e-02, 1.02433955e-01,
1.58553992e-01, 2.27612595e-01, 3.84148807e-01, 5.65629731e-01,
1.07566085e+00, 9.74159503e-01],
[2.39275526e-02, 6.98107944e-02, 8.44269638e-02, 1.09999353e-01,
2.47482489e-01, 4.01109042e-01, 5.24005132e-01, 9.62735996e-01,
1.61645974e+00, 1.43942491e+00],
[2.09996045e-02, 8.22097499e-02, 2.10721662e-01, 3.12594289e-01,
4.84813194e-01, 8.16088700e-01, 1.29269479e+00, 1.65792382e+00,
2.20209915e+00, 3.39107140e+00],
[0.00000000e+00, 5.22314165e-02, 2.41595651e-01, 4.22467516e-01,
6.25736022e-01, 7.12439438e-01, 2.08346370e+00, 3.28464640e+00,
3.79746486e+00, 5.89371046e+00],
[0.00000000e+00, 0.00000000e+00, 4.14289002e-02, 1.78576928e-01,
9.12966633e-01, 1.40156387e+00, 1.27983718e+00, 4.84976577e+00,
6.98025075e+00, 9.92256338e+00],
[0.00000000e+00, 0.00000000e+00, 6.74471744e-03, 1.92706213e-02,
3.49830663e-02, 5.96848511e-02, 8.28928265e-02, 1.05060024e-01,
1.00046447e+01, 0.00000000e+00]])}
algo_targets: {'Values': array([[1.17065175e-01, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00, 1.20869146e-02, 6.50801063e-03, 1.08455100e-01,
1.25939840e-01, 0.00000000e+00],
[0.00000000e+00, 0.00000000e+00, 9.30697487e-03, 6.74433462e-03,
2.87816477e-02, 3.12467594e-02, 1.03059572e-01, 1.52781881e-01,
1.58366091e-01, 0.00000000e+00],
[1.77384263e-03, 1.47800884e-02, 2.74846931e-02, 3.04573845e-02,
7.14399810e-02, 1.01562738e-01, 1.53524012e-01, 2.30581627e-01,
1.78870946e-01, 1.75414748e-01],
[6.40534487e-03, 2.82016679e-02, 3.19684901e-02, 5.26038043e-02,
7.84100241e-02, 1.72884035e-01, 1.99857466e-01, 3.47990968e-01,
5.79664376e-01, 2.56996466e-01],
[2.04541062e-02, 4.19457138e-02, 5.22520506e-02, 1.02433955e-01,
1.58553992e-01, 2.27612595e-01, 3.84148807e-01, 5.65629731e-01,
1.07566085e+00, 9.74159503e-01],
[2.39275526e-02, 6.98107944e-02, 8.44269638e-02, 1.09999353e-01,
2.47482489e-01, 4.01109042e-01, 5.24005132e-01, 9.62735996e-01,
1.61645974e+00, 1.43942491e+00],
[2.09996045e-02, 8.22097499e-02, 2.10721662e-01, 3.12594289e-01,
4.84813194e-01, 8.16088700e-01, 1.29269479e+00, 1.65792382e+00,
2.20209915e+00, 3.39107140e+00],
[0.00000000e+00, 5.22314165e-02, 2.41595651e-01, 4.22467516e-01,
6.25736022e-01, 7.12439438e-01, 2.08346370e+00, 3.28464640e+00,
3.79746486e+00, 5.89371046e+00],
[0.00000000e+00, 0.00000000e+00, 4.14289002e-02, 1.78576928e-01,
9.12966633e-01, 1.40156387e+00, 1.27983718e+00, 4.84976577e+00,
6.98025075e+00, 9.92256338e+00],
[0.00000000e+00, 0.00000000e+00, 6.74471744e-03, 1.92706213e-02,
3.49830663e-02, 5.96848511e-02, 8.28928265e-02, 1.05060024e-01,
1.00046447e+01, 0.00000000e+00]])}
Shared data Score (normalized to 1): 1.0