936 lines
27 KiB
Plaintext
936 lines
27 KiB
Plaintext
weights_k_0: """
|
|
{((0, 1), 'exit'): 0,
|
|
((0, 2), 'exit'): 0,
|
|
((0, 3), 'exit'): 0,
|
|
((0, 4), 'exit'): 0,
|
|
((0, 5), 'exit'): 0,
|
|
((1, 0), 'exit'): 0,
|
|
((1, 1), 'east'): 0,
|
|
((1, 1), 'north'): 0,
|
|
((1, 1), 'south'): 0,
|
|
((1, 1), 'west'): 0,
|
|
((1, 2), 'east'): 0,
|
|
((1, 2), 'north'): 0,
|
|
((1, 2), 'south'): 0,
|
|
((1, 2), 'west'): 0,
|
|
((1, 3), 'east'): 0,
|
|
((1, 3), 'north'): 0,
|
|
((1, 3), 'south'): 0,
|
|
((1, 3), 'west'): 0,
|
|
((1, 4), 'east'): 0,
|
|
((1, 4), 'north'): 0,
|
|
((1, 4), 'south'): 0,
|
|
((1, 4), 'west'): 0,
|
|
((1, 5), 'east'): 0,
|
|
((1, 5), 'north'): 0,
|
|
((1, 5), 'south'): 0,
|
|
((1, 5), 'west'): 0,
|
|
((1, 6), 'exit'): 0,
|
|
((2, 1), 'exit'): 0,
|
|
((2, 2), 'exit'): 0,
|
|
((2, 3), 'exit'): 0,
|
|
((2, 4), 'exit'): 0,
|
|
((2, 5), 'exit'): 0}
|
|
"""
|
|
|
|
q_values_k_0_action_north: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_0_action_east: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_0_action_exit: """
|
|
__________ 0.0000 __________
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
__________ 0.0000 __________
|
|
"""
|
|
|
|
q_values_k_0_action_south: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_0_action_west: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
weights_k_1: """
|
|
{((0, 1), 'exit'): 0,
|
|
((0, 2), 'exit'): 0,
|
|
((0, 3), 'exit'): 0,
|
|
((0, 4), 'exit'): 0,
|
|
((0, 5), 'exit'): -10.0,
|
|
((1, 0), 'exit'): 0,
|
|
((1, 1), 'east'): 0,
|
|
((1, 1), 'north'): 0,
|
|
((1, 1), 'south'): 0,
|
|
((1, 1), 'west'): 0,
|
|
((1, 2), 'east'): 0,
|
|
((1, 2), 'north'): 0,
|
|
((1, 2), 'south'): 0,
|
|
((1, 2), 'west'): 0,
|
|
((1, 3), 'east'): 0,
|
|
((1, 3), 'north'): 0,
|
|
((1, 3), 'south'): 0,
|
|
((1, 3), 'west'): 0,
|
|
((1, 4), 'east'): 0,
|
|
((1, 4), 'north'): 0,
|
|
((1, 4), 'south'): 0,
|
|
((1, 4), 'west'): 0,
|
|
((1, 5), 'east'): 0,
|
|
((1, 5), 'north'): 0,
|
|
((1, 5), 'south'): 0,
|
|
((1, 5), 'west'): 0,
|
|
((1, 6), 'exit'): 0,
|
|
((2, 1), 'exit'): 0,
|
|
((2, 2), 'exit'): 0,
|
|
((2, 3), 'exit'): 0,
|
|
((2, 4), 'exit'): 0,
|
|
((2, 5), 'exit'): 0}
|
|
"""
|
|
|
|
q_values_k_1_action_north: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_1_action_east: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_1_action_exit: """
|
|
__________ 0.0000 __________
|
|
-10.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
__________ 0.0000 __________
|
|
"""
|
|
|
|
q_values_k_1_action_south: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_1_action_west: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
weights_k_2: """
|
|
{((0, 1), 'exit'): 0,
|
|
((0, 2), 'exit'): 0,
|
|
((0, 3), 'exit'): 0,
|
|
((0, 4), 'exit'): 0,
|
|
((0, 5), 'exit'): -10.0,
|
|
((1, 0), 'exit'): 0,
|
|
((1, 1), 'east'): 0,
|
|
((1, 1), 'north'): 0,
|
|
((1, 1), 'south'): 0,
|
|
((1, 1), 'west'): 0,
|
|
((1, 2), 'east'): 0,
|
|
((1, 2), 'north'): 0,
|
|
((1, 2), 'south'): 0,
|
|
((1, 2), 'west'): 0,
|
|
((1, 3), 'east'): 0,
|
|
((1, 3), 'north'): 0,
|
|
((1, 3), 'south'): 0,
|
|
((1, 3), 'west'): 0,
|
|
((1, 4), 'east'): 0,
|
|
((1, 4), 'north'): 0,
|
|
((1, 4), 'south'): 0,
|
|
((1, 4), 'west'): 0,
|
|
((1, 5), 'east'): 0,
|
|
((1, 5), 'north'): 0,
|
|
((1, 5), 'south'): 0.0,
|
|
((1, 5), 'west'): 0,
|
|
((1, 6), 'exit'): 0,
|
|
((2, 1), 'exit'): 0,
|
|
((2, 2), 'exit'): 0,
|
|
((2, 3), 'exit'): 0,
|
|
((2, 4), 'exit'): 0,
|
|
((2, 5), 'exit'): 0}
|
|
"""
|
|
|
|
q_values_k_2_action_north: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_2_action_east: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_2_action_exit: """
|
|
__________ 0.0000 __________
|
|
-10.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
__________ 0.0000 __________
|
|
"""
|
|
|
|
q_values_k_2_action_south: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_2_action_west: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
weights_k_3: """
|
|
{((0, 1), 'exit'): -10.0,
|
|
((0, 2), 'exit'): 0,
|
|
((0, 3), 'exit'): 0,
|
|
((0, 4), 'exit'): 0,
|
|
((0, 5), 'exit'): -10.0,
|
|
((1, 0), 'exit'): 0,
|
|
((1, 1), 'east'): 0,
|
|
((1, 1), 'north'): 0,
|
|
((1, 1), 'south'): 0,
|
|
((1, 1), 'west'): 0,
|
|
((1, 2), 'east'): 0,
|
|
((1, 2), 'north'): 0,
|
|
((1, 2), 'south'): 0,
|
|
((1, 2), 'west'): 0,
|
|
((1, 3), 'east'): 0,
|
|
((1, 3), 'north'): 0,
|
|
((1, 3), 'south'): 0,
|
|
((1, 3), 'west'): 0,
|
|
((1, 4), 'east'): 0,
|
|
((1, 4), 'north'): 0,
|
|
((1, 4), 'south'): 0,
|
|
((1, 4), 'west'): 0,
|
|
((1, 5), 'east'): 0,
|
|
((1, 5), 'north'): 0,
|
|
((1, 5), 'south'): 0.0,
|
|
((1, 5), 'west'): 0,
|
|
((1, 6), 'exit'): 0,
|
|
((2, 1), 'exit'): 0,
|
|
((2, 2), 'exit'): 0,
|
|
((2, 3), 'exit'): 0,
|
|
((2, 4), 'exit'): 0,
|
|
((2, 5), 'exit'): 0}
|
|
"""
|
|
|
|
q_values_k_3_action_north: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_3_action_east: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_3_action_exit: """
|
|
__________ 0.0000 __________
|
|
-10.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
__________ 0.0000 __________
|
|
"""
|
|
|
|
q_values_k_3_action_south: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_3_action_west: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
weights_k_4: """
|
|
{((0, 1), 'exit'): -10.0,
|
|
((0, 2), 'exit'): 0,
|
|
((0, 3), 'exit'): 0,
|
|
((0, 4), 'exit'): -10.0,
|
|
((0, 5), 'exit'): -10.0,
|
|
((1, 0), 'exit'): 0,
|
|
((1, 1), 'east'): 0,
|
|
((1, 1), 'north'): 0,
|
|
((1, 1), 'south'): 0,
|
|
((1, 1), 'west'): 0,
|
|
((1, 2), 'east'): 0,
|
|
((1, 2), 'north'): 0,
|
|
((1, 2), 'south'): 0,
|
|
((1, 2), 'west'): 0,
|
|
((1, 3), 'east'): 0,
|
|
((1, 3), 'north'): 0,
|
|
((1, 3), 'south'): 0,
|
|
((1, 3), 'west'): 0,
|
|
((1, 4), 'east'): 0,
|
|
((1, 4), 'north'): 0,
|
|
((1, 4), 'south'): 0,
|
|
((1, 4), 'west'): 0,
|
|
((1, 5), 'east'): 0,
|
|
((1, 5), 'north'): 0,
|
|
((1, 5), 'south'): 0.0,
|
|
((1, 5), 'west'): 0,
|
|
((1, 6), 'exit'): 0,
|
|
((2, 1), 'exit'): 0,
|
|
((2, 2), 'exit'): 0,
|
|
((2, 3), 'exit'): 0,
|
|
((2, 4), 'exit'): 0,
|
|
((2, 5), 'exit'): 0}
|
|
"""
|
|
|
|
q_values_k_4_action_north: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_4_action_east: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_4_action_exit: """
|
|
__________ 0.0000 __________
|
|
-10.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
0.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
__________ 0.0000 __________
|
|
"""
|
|
|
|
q_values_k_4_action_south: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_4_action_west: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
weights_k_5: """
|
|
{((0, 1), 'exit'): -10.0,
|
|
((0, 2), 'exit'): 0,
|
|
((0, 3), 'exit'): 0,
|
|
((0, 4), 'exit'): -10.0,
|
|
((0, 5), 'exit'): -10.0,
|
|
((1, 0), 'exit'): 0,
|
|
((1, 1), 'east'): 0,
|
|
((1, 1), 'north'): 0,
|
|
((1, 1), 'south'): 0,
|
|
((1, 1), 'west'): 0,
|
|
((1, 2), 'east'): 0,
|
|
((1, 2), 'north'): 0,
|
|
((1, 2), 'south'): 0,
|
|
((1, 2), 'west'): 0,
|
|
((1, 3), 'east'): 0,
|
|
((1, 3), 'north'): 0,
|
|
((1, 3), 'south'): 0,
|
|
((1, 3), 'west'): 0,
|
|
((1, 4), 'east'): 0,
|
|
((1, 4), 'north'): 0,
|
|
((1, 4), 'south'): 0,
|
|
((1, 4), 'west'): 0,
|
|
((1, 5), 'east'): 0,
|
|
((1, 5), 'north'): 0,
|
|
((1, 5), 'south'): 0.0,
|
|
((1, 5), 'west'): 0,
|
|
((1, 6), 'exit'): 0,
|
|
((2, 1), 'exit'): 0,
|
|
((2, 2), 'exit'): 0,
|
|
((2, 3), 'exit'): -10.0,
|
|
((2, 4), 'exit'): 0,
|
|
((2, 5), 'exit'): 0}
|
|
"""
|
|
|
|
q_values_k_5_action_north: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_5_action_east: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_5_action_exit: """
|
|
__________ 0.0000 __________
|
|
-10.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
0.0000 illegal -10.0000
|
|
0.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
__________ 0.0000 __________
|
|
"""
|
|
|
|
q_values_k_5_action_south: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_5_action_west: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
weights_k_6: """
|
|
{((0, 1), 'exit'): -10.0,
|
|
((0, 2), 'exit'): 0,
|
|
((0, 3), 'exit'): -10.0,
|
|
((0, 4), 'exit'): -10.0,
|
|
((0, 5), 'exit'): -10.0,
|
|
((1, 0), 'exit'): 0,
|
|
((1, 1), 'east'): 0,
|
|
((1, 1), 'north'): 0,
|
|
((1, 1), 'south'): 0,
|
|
((1, 1), 'west'): 0,
|
|
((1, 2), 'east'): 0,
|
|
((1, 2), 'north'): 0,
|
|
((1, 2), 'south'): 0,
|
|
((1, 2), 'west'): 0,
|
|
((1, 3), 'east'): 0,
|
|
((1, 3), 'north'): 0,
|
|
((1, 3), 'south'): 0,
|
|
((1, 3), 'west'): 0,
|
|
((1, 4), 'east'): 0,
|
|
((1, 4), 'north'): 0,
|
|
((1, 4), 'south'): 0,
|
|
((1, 4), 'west'): 0,
|
|
((1, 5), 'east'): 0,
|
|
((1, 5), 'north'): 0,
|
|
((1, 5), 'south'): 0.0,
|
|
((1, 5), 'west'): 0,
|
|
((1, 6), 'exit'): 0,
|
|
((2, 1), 'exit'): 0,
|
|
((2, 2), 'exit'): 0,
|
|
((2, 3), 'exit'): -10.0,
|
|
((2, 4), 'exit'): 0,
|
|
((2, 5), 'exit'): 0}
|
|
"""
|
|
|
|
q_values_k_6_action_north: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_6_action_east: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_6_action_exit: """
|
|
__________ 0.0000 __________
|
|
-10.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
-10.0000 illegal -10.0000
|
|
0.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
__________ 0.0000 __________
|
|
"""
|
|
|
|
q_values_k_6_action_south: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_6_action_west: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
weights_k_7: """
|
|
{((0, 1), 'exit'): -10.0,
|
|
((0, 2), 'exit'): 0,
|
|
((0, 3), 'exit'): -10.0,
|
|
((0, 4), 'exit'): -10.0,
|
|
((0, 5), 'exit'): -10.0,
|
|
((1, 0), 'exit'): 0,
|
|
((1, 1), 'east'): 0,
|
|
((1, 1), 'north'): 0,
|
|
((1, 1), 'south'): 0,
|
|
((1, 1), 'west'): 0,
|
|
((1, 2), 'east'): 0,
|
|
((1, 2), 'north'): 0,
|
|
((1, 2), 'south'): 0,
|
|
((1, 2), 'west'): 0,
|
|
((1, 3), 'east'): 0,
|
|
((1, 3), 'north'): 0,
|
|
((1, 3), 'south'): 0.0,
|
|
((1, 3), 'west'): 0,
|
|
((1, 4), 'east'): 0,
|
|
((1, 4), 'north'): 0,
|
|
((1, 4), 'south'): 0,
|
|
((1, 4), 'west'): 0,
|
|
((1, 5), 'east'): 0,
|
|
((1, 5), 'north'): 0,
|
|
((1, 5), 'south'): 0.0,
|
|
((1, 5), 'west'): 0,
|
|
((1, 6), 'exit'): 0,
|
|
((2, 1), 'exit'): 0,
|
|
((2, 2), 'exit'): 0,
|
|
((2, 3), 'exit'): -10.0,
|
|
((2, 4), 'exit'): 0,
|
|
((2, 5), 'exit'): 0}
|
|
"""
|
|
|
|
q_values_k_7_action_north: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_7_action_east: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_7_action_exit: """
|
|
__________ 0.0000 __________
|
|
-10.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
-10.0000 illegal -10.0000
|
|
0.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
__________ 0.0000 __________
|
|
"""
|
|
|
|
q_values_k_7_action_south: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_7_action_west: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
weights_k_8: """
|
|
{((0, 1), 'exit'): -10.0,
|
|
((0, 2), 'exit'): -10.0,
|
|
((0, 3), 'exit'): -10.0,
|
|
((0, 4), 'exit'): -10.0,
|
|
((0, 5), 'exit'): -10.0,
|
|
((1, 0), 'exit'): 0,
|
|
((1, 1), 'east'): 0,
|
|
((1, 1), 'north'): 0,
|
|
((1, 1), 'south'): 0,
|
|
((1, 1), 'west'): 0,
|
|
((1, 2), 'east'): 0,
|
|
((1, 2), 'north'): 0,
|
|
((1, 2), 'south'): 0,
|
|
((1, 2), 'west'): 0,
|
|
((1, 3), 'east'): 0,
|
|
((1, 3), 'north'): 0,
|
|
((1, 3), 'south'): 0.0,
|
|
((1, 3), 'west'): 0,
|
|
((1, 4), 'east'): 0,
|
|
((1, 4), 'north'): 0,
|
|
((1, 4), 'south'): 0,
|
|
((1, 4), 'west'): 0,
|
|
((1, 5), 'east'): 0,
|
|
((1, 5), 'north'): 0,
|
|
((1, 5), 'south'): 0.0,
|
|
((1, 5), 'west'): 0,
|
|
((1, 6), 'exit'): 0,
|
|
((2, 1), 'exit'): 0,
|
|
((2, 2), 'exit'): 0,
|
|
((2, 3), 'exit'): -10.0,
|
|
((2, 4), 'exit'): 0,
|
|
((2, 5), 'exit'): 0}
|
|
"""
|
|
|
|
q_values_k_8_action_north: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_8_action_east: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_8_action_exit: """
|
|
__________ 0.0000 __________
|
|
-10.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
-10.0000 illegal -10.0000
|
|
-10.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
__________ 0.0000 __________
|
|
"""
|
|
|
|
q_values_k_8_action_south: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_8_action_west: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
weights_k_9: """
|
|
{((0, 1), 'exit'): -10.0,
|
|
((0, 2), 'exit'): -10.0,
|
|
((0, 3), 'exit'): -10.0,
|
|
((0, 4), 'exit'): -10.0,
|
|
((0, 5), 'exit'): -10.0,
|
|
((1, 0), 'exit'): 0.1,
|
|
((1, 1), 'east'): 0,
|
|
((1, 1), 'north'): 0,
|
|
((1, 1), 'south'): 0,
|
|
((1, 1), 'west'): 0,
|
|
((1, 2), 'east'): 0,
|
|
((1, 2), 'north'): 0,
|
|
((1, 2), 'south'): 0,
|
|
((1, 2), 'west'): 0,
|
|
((1, 3), 'east'): 0,
|
|
((1, 3), 'north'): 0,
|
|
((1, 3), 'south'): 0.0,
|
|
((1, 3), 'west'): 0,
|
|
((1, 4), 'east'): 0,
|
|
((1, 4), 'north'): 0,
|
|
((1, 4), 'south'): 0,
|
|
((1, 4), 'west'): 0,
|
|
((1, 5), 'east'): 0,
|
|
((1, 5), 'north'): 0,
|
|
((1, 5), 'south'): 0.0,
|
|
((1, 5), 'west'): 0,
|
|
((1, 6), 'exit'): 0,
|
|
((2, 1), 'exit'): 0,
|
|
((2, 2), 'exit'): 0,
|
|
((2, 3), 'exit'): -10.0,
|
|
((2, 4), 'exit'): 0,
|
|
((2, 5), 'exit'): 0}
|
|
"""
|
|
|
|
q_values_k_9_action_north: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_9_action_east: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_9_action_exit: """
|
|
__________ 0.0000 __________
|
|
-10.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
-10.0000 illegal -10.0000
|
|
-10.0000 illegal 0.0000
|
|
-10.0000 illegal 0.0000
|
|
__________ 0.1000 __________
|
|
"""
|
|
|
|
q_values_k_9_action_south: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_9_action_west: """
|
|
__________ illegal __________
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
illegal 0.0000 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
weights_k_500: """
|
|
{((0, 1), 'exit'): -92.82102012308148,
|
|
((0, 2), 'exit'): -97.21871610556306,
|
|
((0, 3), 'exit'): -89.05810108684878,
|
|
((0, 4), 'exit'): -97.74716004550608,
|
|
((0, 5), 'exit'): -96.56631617970748,
|
|
((1, 0), 'exit'): 0.9576088417247839,
|
|
((1, 1), 'east'): -31.68839649871871,
|
|
((1, 1), 'north'): -0.5871409700255297,
|
|
((1, 1), 'south'): -5.571799344704395,
|
|
((1, 1), 'west'): -20.777007017445538,
|
|
((1, 2), 'east'): -43.595242197319,
|
|
((1, 2), 'north'): -1.264202431807023,
|
|
((1, 2), 'south'): -8.401530599975509,
|
|
((1, 2), 'west'): -16.283916171605192,
|
|
((1, 3), 'east'): -3.6956691,
|
|
((1, 3), 'north'): -0.16712710492783758,
|
|
((1, 3), 'south'): -3.4722840178579073,
|
|
((1, 3), 'west'): -40.58867937480968,
|
|
((1, 4), 'east'): -26.553386621338632,
|
|
((1, 4), 'north'): -0.799493322153628,
|
|
((1, 4), 'south'): -6.727671187497919,
|
|
((1, 4), 'west'): -39.06095135014759,
|
|
((1, 5), 'east'): -17.067638934181446,
|
|
((1, 5), 'north'): -5.864753060887024,
|
|
((1, 5), 'south'): -6.83769420759525,
|
|
((1, 5), 'west'): -27.062643066307515,
|
|
((1, 6), 'exit'): 9.353891811077332,
|
|
((2, 1), 'exit'): -97.21871610556306,
|
|
((2, 2), 'exit'): -87.84233454094309,
|
|
((2, 3), 'exit'): -96.90968456173674,
|
|
((2, 4), 'exit'): -94.185026299696,
|
|
((2, 5), 'exit'): -96.90968456173674}
|
|
"""
|
|
|
|
q_values_k_500_action_north: """
|
|
__________ illegal __________
|
|
illegal -5.8648 illegal
|
|
illegal -0.7995 illegal
|
|
illegal -0.1671 illegal
|
|
illegal -1.2642 illegal
|
|
illegal -0.5871 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_500_action_east: """
|
|
__________ illegal __________
|
|
illegal -17.0676 illegal
|
|
illegal -26.5534 illegal
|
|
illegal -3.6957 illegal
|
|
illegal -43.5952 illegal
|
|
illegal -31.6884 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_500_action_exit: """
|
|
__________ 9.3539 __________
|
|
-96.5663 illegal -96.9097
|
|
-97.7472 illegal -94.1850
|
|
-89.0581 illegal -96.9097
|
|
-97.2187 illegal -87.8423
|
|
-92.8210 illegal -97.2187
|
|
__________ 0.9576 __________
|
|
"""
|
|
|
|
q_values_k_500_action_south: """
|
|
__________ illegal __________
|
|
illegal -6.8377 illegal
|
|
illegal -6.7277 illegal
|
|
illegal -3.4723 illegal
|
|
illegal -8.4015 illegal
|
|
illegal -5.5718 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|
|
q_values_k_500_action_west: """
|
|
__________ illegal __________
|
|
illegal -27.0626 illegal
|
|
illegal -39.0610 illegal
|
|
illegal -40.5887 illegal
|
|
illegal -16.2839 illegal
|
|
illegal -20.7770 illegal
|
|
__________ illegal __________
|
|
"""
|
|
|