intro2ai/p3_rl/test_cases/q8/3-bridge.solution

936 lines
27 KiB
Plaintext

weights_k_0: """
{((0, 1), 'exit'): 0,
((0, 2), 'exit'): 0,
((0, 3), 'exit'): 0,
((0, 4), 'exit'): 0,
((0, 5), 'exit'): 0,
((1, 0), 'exit'): 0,
((1, 1), 'east'): 0,
((1, 1), 'north'): 0,
((1, 1), 'south'): 0,
((1, 1), 'west'): 0,
((1, 2), 'east'): 0,
((1, 2), 'north'): 0,
((1, 2), 'south'): 0,
((1, 2), 'west'): 0,
((1, 3), 'east'): 0,
((1, 3), 'north'): 0,
((1, 3), 'south'): 0,
((1, 3), 'west'): 0,
((1, 4), 'east'): 0,
((1, 4), 'north'): 0,
((1, 4), 'south'): 0,
((1, 4), 'west'): 0,
((1, 5), 'east'): 0,
((1, 5), 'north'): 0,
((1, 5), 'south'): 0,
((1, 5), 'west'): 0,
((1, 6), 'exit'): 0,
((2, 1), 'exit'): 0,
((2, 2), 'exit'): 0,
((2, 3), 'exit'): 0,
((2, 4), 'exit'): 0,
((2, 5), 'exit'): 0}
"""
q_values_k_0_action_north: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_0_action_east: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_0_action_exit: """
__________ 0.0000 __________
0.0000 illegal 0.0000
0.0000 illegal 0.0000
0.0000 illegal 0.0000
0.0000 illegal 0.0000
0.0000 illegal 0.0000
__________ 0.0000 __________
"""
q_values_k_0_action_south: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_0_action_west: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
weights_k_1: """
{((0, 1), 'exit'): 0,
((0, 2), 'exit'): 0,
((0, 3), 'exit'): 0,
((0, 4), 'exit'): 0,
((0, 5), 'exit'): -10.0,
((1, 0), 'exit'): 0,
((1, 1), 'east'): 0,
((1, 1), 'north'): 0,
((1, 1), 'south'): 0,
((1, 1), 'west'): 0,
((1, 2), 'east'): 0,
((1, 2), 'north'): 0,
((1, 2), 'south'): 0,
((1, 2), 'west'): 0,
((1, 3), 'east'): 0,
((1, 3), 'north'): 0,
((1, 3), 'south'): 0,
((1, 3), 'west'): 0,
((1, 4), 'east'): 0,
((1, 4), 'north'): 0,
((1, 4), 'south'): 0,
((1, 4), 'west'): 0,
((1, 5), 'east'): 0,
((1, 5), 'north'): 0,
((1, 5), 'south'): 0,
((1, 5), 'west'): 0,
((1, 6), 'exit'): 0,
((2, 1), 'exit'): 0,
((2, 2), 'exit'): 0,
((2, 3), 'exit'): 0,
((2, 4), 'exit'): 0,
((2, 5), 'exit'): 0}
"""
q_values_k_1_action_north: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_1_action_east: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_1_action_exit: """
__________ 0.0000 __________
-10.0000 illegal 0.0000
0.0000 illegal 0.0000
0.0000 illegal 0.0000
0.0000 illegal 0.0000
0.0000 illegal 0.0000
__________ 0.0000 __________
"""
q_values_k_1_action_south: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_1_action_west: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
weights_k_2: """
{((0, 1), 'exit'): 0,
((0, 2), 'exit'): 0,
((0, 3), 'exit'): 0,
((0, 4), 'exit'): 0,
((0, 5), 'exit'): -10.0,
((1, 0), 'exit'): 0,
((1, 1), 'east'): 0,
((1, 1), 'north'): 0,
((1, 1), 'south'): 0,
((1, 1), 'west'): 0,
((1, 2), 'east'): 0,
((1, 2), 'north'): 0,
((1, 2), 'south'): 0,
((1, 2), 'west'): 0,
((1, 3), 'east'): 0,
((1, 3), 'north'): 0,
((1, 3), 'south'): 0,
((1, 3), 'west'): 0,
((1, 4), 'east'): 0,
((1, 4), 'north'): 0,
((1, 4), 'south'): 0,
((1, 4), 'west'): 0,
((1, 5), 'east'): 0,
((1, 5), 'north'): 0,
((1, 5), 'south'): 0.0,
((1, 5), 'west'): 0,
((1, 6), 'exit'): 0,
((2, 1), 'exit'): 0,
((2, 2), 'exit'): 0,
((2, 3), 'exit'): 0,
((2, 4), 'exit'): 0,
((2, 5), 'exit'): 0}
"""
q_values_k_2_action_north: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_2_action_east: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_2_action_exit: """
__________ 0.0000 __________
-10.0000 illegal 0.0000
0.0000 illegal 0.0000
0.0000 illegal 0.0000
0.0000 illegal 0.0000
0.0000 illegal 0.0000
__________ 0.0000 __________
"""
q_values_k_2_action_south: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_2_action_west: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
weights_k_3: """
{((0, 1), 'exit'): -10.0,
((0, 2), 'exit'): 0,
((0, 3), 'exit'): 0,
((0, 4), 'exit'): 0,
((0, 5), 'exit'): -10.0,
((1, 0), 'exit'): 0,
((1, 1), 'east'): 0,
((1, 1), 'north'): 0,
((1, 1), 'south'): 0,
((1, 1), 'west'): 0,
((1, 2), 'east'): 0,
((1, 2), 'north'): 0,
((1, 2), 'south'): 0,
((1, 2), 'west'): 0,
((1, 3), 'east'): 0,
((1, 3), 'north'): 0,
((1, 3), 'south'): 0,
((1, 3), 'west'): 0,
((1, 4), 'east'): 0,
((1, 4), 'north'): 0,
((1, 4), 'south'): 0,
((1, 4), 'west'): 0,
((1, 5), 'east'): 0,
((1, 5), 'north'): 0,
((1, 5), 'south'): 0.0,
((1, 5), 'west'): 0,
((1, 6), 'exit'): 0,
((2, 1), 'exit'): 0,
((2, 2), 'exit'): 0,
((2, 3), 'exit'): 0,
((2, 4), 'exit'): 0,
((2, 5), 'exit'): 0}
"""
q_values_k_3_action_north: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_3_action_east: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_3_action_exit: """
__________ 0.0000 __________
-10.0000 illegal 0.0000
0.0000 illegal 0.0000
0.0000 illegal 0.0000
0.0000 illegal 0.0000
-10.0000 illegal 0.0000
__________ 0.0000 __________
"""
q_values_k_3_action_south: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_3_action_west: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
weights_k_4: """
{((0, 1), 'exit'): -10.0,
((0, 2), 'exit'): 0,
((0, 3), 'exit'): 0,
((0, 4), 'exit'): -10.0,
((0, 5), 'exit'): -10.0,
((1, 0), 'exit'): 0,
((1, 1), 'east'): 0,
((1, 1), 'north'): 0,
((1, 1), 'south'): 0,
((1, 1), 'west'): 0,
((1, 2), 'east'): 0,
((1, 2), 'north'): 0,
((1, 2), 'south'): 0,
((1, 2), 'west'): 0,
((1, 3), 'east'): 0,
((1, 3), 'north'): 0,
((1, 3), 'south'): 0,
((1, 3), 'west'): 0,
((1, 4), 'east'): 0,
((1, 4), 'north'): 0,
((1, 4), 'south'): 0,
((1, 4), 'west'): 0,
((1, 5), 'east'): 0,
((1, 5), 'north'): 0,
((1, 5), 'south'): 0.0,
((1, 5), 'west'): 0,
((1, 6), 'exit'): 0,
((2, 1), 'exit'): 0,
((2, 2), 'exit'): 0,
((2, 3), 'exit'): 0,
((2, 4), 'exit'): 0,
((2, 5), 'exit'): 0}
"""
q_values_k_4_action_north: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_4_action_east: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_4_action_exit: """
__________ 0.0000 __________
-10.0000 illegal 0.0000
-10.0000 illegal 0.0000
0.0000 illegal 0.0000
0.0000 illegal 0.0000
-10.0000 illegal 0.0000
__________ 0.0000 __________
"""
q_values_k_4_action_south: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_4_action_west: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
weights_k_5: """
{((0, 1), 'exit'): -10.0,
((0, 2), 'exit'): 0,
((0, 3), 'exit'): 0,
((0, 4), 'exit'): -10.0,
((0, 5), 'exit'): -10.0,
((1, 0), 'exit'): 0,
((1, 1), 'east'): 0,
((1, 1), 'north'): 0,
((1, 1), 'south'): 0,
((1, 1), 'west'): 0,
((1, 2), 'east'): 0,
((1, 2), 'north'): 0,
((1, 2), 'south'): 0,
((1, 2), 'west'): 0,
((1, 3), 'east'): 0,
((1, 3), 'north'): 0,
((1, 3), 'south'): 0,
((1, 3), 'west'): 0,
((1, 4), 'east'): 0,
((1, 4), 'north'): 0,
((1, 4), 'south'): 0,
((1, 4), 'west'): 0,
((1, 5), 'east'): 0,
((1, 5), 'north'): 0,
((1, 5), 'south'): 0.0,
((1, 5), 'west'): 0,
((1, 6), 'exit'): 0,
((2, 1), 'exit'): 0,
((2, 2), 'exit'): 0,
((2, 3), 'exit'): -10.0,
((2, 4), 'exit'): 0,
((2, 5), 'exit'): 0}
"""
q_values_k_5_action_north: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_5_action_east: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_5_action_exit: """
__________ 0.0000 __________
-10.0000 illegal 0.0000
-10.0000 illegal 0.0000
0.0000 illegal -10.0000
0.0000 illegal 0.0000
-10.0000 illegal 0.0000
__________ 0.0000 __________
"""
q_values_k_5_action_south: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_5_action_west: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
weights_k_6: """
{((0, 1), 'exit'): -10.0,
((0, 2), 'exit'): 0,
((0, 3), 'exit'): -10.0,
((0, 4), 'exit'): -10.0,
((0, 5), 'exit'): -10.0,
((1, 0), 'exit'): 0,
((1, 1), 'east'): 0,
((1, 1), 'north'): 0,
((1, 1), 'south'): 0,
((1, 1), 'west'): 0,
((1, 2), 'east'): 0,
((1, 2), 'north'): 0,
((1, 2), 'south'): 0,
((1, 2), 'west'): 0,
((1, 3), 'east'): 0,
((1, 3), 'north'): 0,
((1, 3), 'south'): 0,
((1, 3), 'west'): 0,
((1, 4), 'east'): 0,
((1, 4), 'north'): 0,
((1, 4), 'south'): 0,
((1, 4), 'west'): 0,
((1, 5), 'east'): 0,
((1, 5), 'north'): 0,
((1, 5), 'south'): 0.0,
((1, 5), 'west'): 0,
((1, 6), 'exit'): 0,
((2, 1), 'exit'): 0,
((2, 2), 'exit'): 0,
((2, 3), 'exit'): -10.0,
((2, 4), 'exit'): 0,
((2, 5), 'exit'): 0}
"""
q_values_k_6_action_north: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_6_action_east: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_6_action_exit: """
__________ 0.0000 __________
-10.0000 illegal 0.0000
-10.0000 illegal 0.0000
-10.0000 illegal -10.0000
0.0000 illegal 0.0000
-10.0000 illegal 0.0000
__________ 0.0000 __________
"""
q_values_k_6_action_south: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_6_action_west: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
weights_k_7: """
{((0, 1), 'exit'): -10.0,
((0, 2), 'exit'): 0,
((0, 3), 'exit'): -10.0,
((0, 4), 'exit'): -10.0,
((0, 5), 'exit'): -10.0,
((1, 0), 'exit'): 0,
((1, 1), 'east'): 0,
((1, 1), 'north'): 0,
((1, 1), 'south'): 0,
((1, 1), 'west'): 0,
((1, 2), 'east'): 0,
((1, 2), 'north'): 0,
((1, 2), 'south'): 0,
((1, 2), 'west'): 0,
((1, 3), 'east'): 0,
((1, 3), 'north'): 0,
((1, 3), 'south'): 0.0,
((1, 3), 'west'): 0,
((1, 4), 'east'): 0,
((1, 4), 'north'): 0,
((1, 4), 'south'): 0,
((1, 4), 'west'): 0,
((1, 5), 'east'): 0,
((1, 5), 'north'): 0,
((1, 5), 'south'): 0.0,
((1, 5), 'west'): 0,
((1, 6), 'exit'): 0,
((2, 1), 'exit'): 0,
((2, 2), 'exit'): 0,
((2, 3), 'exit'): -10.0,
((2, 4), 'exit'): 0,
((2, 5), 'exit'): 0}
"""
q_values_k_7_action_north: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_7_action_east: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_7_action_exit: """
__________ 0.0000 __________
-10.0000 illegal 0.0000
-10.0000 illegal 0.0000
-10.0000 illegal -10.0000
0.0000 illegal 0.0000
-10.0000 illegal 0.0000
__________ 0.0000 __________
"""
q_values_k_7_action_south: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_7_action_west: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
weights_k_8: """
{((0, 1), 'exit'): -10.0,
((0, 2), 'exit'): -10.0,
((0, 3), 'exit'): -10.0,
((0, 4), 'exit'): -10.0,
((0, 5), 'exit'): -10.0,
((1, 0), 'exit'): 0,
((1, 1), 'east'): 0,
((1, 1), 'north'): 0,
((1, 1), 'south'): 0,
((1, 1), 'west'): 0,
((1, 2), 'east'): 0,
((1, 2), 'north'): 0,
((1, 2), 'south'): 0,
((1, 2), 'west'): 0,
((1, 3), 'east'): 0,
((1, 3), 'north'): 0,
((1, 3), 'south'): 0.0,
((1, 3), 'west'): 0,
((1, 4), 'east'): 0,
((1, 4), 'north'): 0,
((1, 4), 'south'): 0,
((1, 4), 'west'): 0,
((1, 5), 'east'): 0,
((1, 5), 'north'): 0,
((1, 5), 'south'): 0.0,
((1, 5), 'west'): 0,
((1, 6), 'exit'): 0,
((2, 1), 'exit'): 0,
((2, 2), 'exit'): 0,
((2, 3), 'exit'): -10.0,
((2, 4), 'exit'): 0,
((2, 5), 'exit'): 0}
"""
q_values_k_8_action_north: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_8_action_east: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_8_action_exit: """
__________ 0.0000 __________
-10.0000 illegal 0.0000
-10.0000 illegal 0.0000
-10.0000 illegal -10.0000
-10.0000 illegal 0.0000
-10.0000 illegal 0.0000
__________ 0.0000 __________
"""
q_values_k_8_action_south: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_8_action_west: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
weights_k_9: """
{((0, 1), 'exit'): -10.0,
((0, 2), 'exit'): -10.0,
((0, 3), 'exit'): -10.0,
((0, 4), 'exit'): -10.0,
((0, 5), 'exit'): -10.0,
((1, 0), 'exit'): 0.1,
((1, 1), 'east'): 0,
((1, 1), 'north'): 0,
((1, 1), 'south'): 0,
((1, 1), 'west'): 0,
((1, 2), 'east'): 0,
((1, 2), 'north'): 0,
((1, 2), 'south'): 0,
((1, 2), 'west'): 0,
((1, 3), 'east'): 0,
((1, 3), 'north'): 0,
((1, 3), 'south'): 0.0,
((1, 3), 'west'): 0,
((1, 4), 'east'): 0,
((1, 4), 'north'): 0,
((1, 4), 'south'): 0,
((1, 4), 'west'): 0,
((1, 5), 'east'): 0,
((1, 5), 'north'): 0,
((1, 5), 'south'): 0.0,
((1, 5), 'west'): 0,
((1, 6), 'exit'): 0,
((2, 1), 'exit'): 0,
((2, 2), 'exit'): 0,
((2, 3), 'exit'): -10.0,
((2, 4), 'exit'): 0,
((2, 5), 'exit'): 0}
"""
q_values_k_9_action_north: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_9_action_east: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_9_action_exit: """
__________ 0.0000 __________
-10.0000 illegal 0.0000
-10.0000 illegal 0.0000
-10.0000 illegal -10.0000
-10.0000 illegal 0.0000
-10.0000 illegal 0.0000
__________ 0.1000 __________
"""
q_values_k_9_action_south: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_9_action_west: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
weights_k_500: """
{((0, 1), 'exit'): -92.82102012308148,
((0, 2), 'exit'): -97.21871610556306,
((0, 3), 'exit'): -89.05810108684878,
((0, 4), 'exit'): -97.74716004550608,
((0, 5), 'exit'): -96.56631617970748,
((1, 0), 'exit'): 0.9576088417247839,
((1, 1), 'east'): -31.68839649871871,
((1, 1), 'north'): -0.5871409700255297,
((1, 1), 'south'): -5.571799344704395,
((1, 1), 'west'): -20.777007017445538,
((1, 2), 'east'): -43.595242197319,
((1, 2), 'north'): -1.264202431807023,
((1, 2), 'south'): -8.401530599975509,
((1, 2), 'west'): -16.283916171605192,
((1, 3), 'east'): -3.6956691,
((1, 3), 'north'): -0.16712710492783758,
((1, 3), 'south'): -3.4722840178579073,
((1, 3), 'west'): -40.58867937480968,
((1, 4), 'east'): -26.553386621338632,
((1, 4), 'north'): -0.799493322153628,
((1, 4), 'south'): -6.727671187497919,
((1, 4), 'west'): -39.06095135014759,
((1, 5), 'east'): -17.067638934181446,
((1, 5), 'north'): -5.864753060887024,
((1, 5), 'south'): -6.83769420759525,
((1, 5), 'west'): -27.062643066307515,
((1, 6), 'exit'): 9.353891811077332,
((2, 1), 'exit'): -97.21871610556306,
((2, 2), 'exit'): -87.84233454094309,
((2, 3), 'exit'): -96.90968456173674,
((2, 4), 'exit'): -94.185026299696,
((2, 5), 'exit'): -96.90968456173674}
"""
q_values_k_500_action_north: """
__________ illegal __________
illegal -5.8648 illegal
illegal -0.7995 illegal
illegal -0.1671 illegal
illegal -1.2642 illegal
illegal -0.5871 illegal
__________ illegal __________
"""
q_values_k_500_action_east: """
__________ illegal __________
illegal -17.0676 illegal
illegal -26.5534 illegal
illegal -3.6957 illegal
illegal -43.5952 illegal
illegal -31.6884 illegal
__________ illegal __________
"""
q_values_k_500_action_exit: """
__________ 9.3539 __________
-96.5663 illegal -96.9097
-97.7472 illegal -94.1850
-89.0581 illegal -96.9097
-97.2187 illegal -87.8423
-92.8210 illegal -97.2187
__________ 0.9576 __________
"""
q_values_k_500_action_south: """
__________ illegal __________
illegal -6.8377 illegal
illegal -6.7277 illegal
illegal -3.4723 illegal
illegal -8.4015 illegal
illegal -5.5718 illegal
__________ illegal __________
"""
q_values_k_500_action_west: """
__________ illegal __________
illegal -27.0626 illegal
illegal -39.0610 illegal
illegal -40.5887 illegal
illegal -16.2839 illegal
illegal -20.7770 illegal
__________ illegal __________
"""