430 lines
6.9 KiB
Plaintext
430 lines
6.9 KiB
Plaintext
|
weights_k_0: """
|
||
|
{((0, 0), 'exit'): 0,
|
||
|
((0, 1), 'east'): 0,
|
||
|
((0, 1), 'north'): 0,
|
||
|
((0, 1), 'south'): 0,
|
||
|
((0, 1), 'west'): 0,
|
||
|
((0, 2), 'exit'): 0}
|
||
|
"""
|
||
|
|
||
|
q_values_k_0_action_north: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_0_action_east: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_0_action_exit: """
|
||
|
0.0000
|
||
|
illegal
|
||
|
0.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_0_action_south: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_0_action_west: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
weights_k_1: """
|
||
|
{((0, 0), 'exit'): 1.0,
|
||
|
((0, 1), 'east'): 0,
|
||
|
((0, 1), 'north'): 0,
|
||
|
((0, 1), 'south'): 0,
|
||
|
((0, 1), 'west'): 0,
|
||
|
((0, 2), 'exit'): 0}
|
||
|
"""
|
||
|
|
||
|
q_values_k_1_action_north: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_1_action_east: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_1_action_exit: """
|
||
|
0.0000
|
||
|
illegal
|
||
|
1.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_1_action_south: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_1_action_west: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
weights_k_2: """
|
||
|
{((0, 0), 'exit'): 1.0,
|
||
|
((0, 1), 'east'): 0,
|
||
|
((0, 1), 'north'): 0,
|
||
|
((0, 1), 'south'): 0.0,
|
||
|
((0, 1), 'west'): 0,
|
||
|
((0, 2), 'exit'): 0}
|
||
|
"""
|
||
|
|
||
|
q_values_k_2_action_north: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_2_action_east: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_2_action_exit: """
|
||
|
0.0000
|
||
|
illegal
|
||
|
1.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_2_action_south: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_2_action_west: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
weights_k_3: """
|
||
|
{((0, 0), 'exit'): 1.9,
|
||
|
((0, 1), 'east'): 0,
|
||
|
((0, 1), 'north'): 0,
|
||
|
((0, 1), 'south'): 0.0,
|
||
|
((0, 1), 'west'): 0,
|
||
|
((0, 2), 'exit'): 0}
|
||
|
"""
|
||
|
|
||
|
q_values_k_3_action_north: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_3_action_east: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_3_action_exit: """
|
||
|
0.0000
|
||
|
illegal
|
||
|
1.9000
|
||
|
"""
|
||
|
|
||
|
q_values_k_3_action_south: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_3_action_west: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
weights_k_4: """
|
||
|
{((0, 0), 'exit'): 2.71,
|
||
|
((0, 1), 'east'): 0,
|
||
|
((0, 1), 'north'): 0,
|
||
|
((0, 1), 'south'): 0.0,
|
||
|
((0, 1), 'west'): 0,
|
||
|
((0, 2), 'exit'): 0}
|
||
|
"""
|
||
|
|
||
|
q_values_k_4_action_north: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_4_action_east: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_4_action_exit: """
|
||
|
0.0000
|
||
|
illegal
|
||
|
2.7100
|
||
|
"""
|
||
|
|
||
|
q_values_k_4_action_south: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_4_action_west: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
weights_k_5: """
|
||
|
{((0, 0), 'exit'): 2.71,
|
||
|
((0, 1), 'east'): 0,
|
||
|
((0, 1), 'north'): 0,
|
||
|
((0, 1), 'south'): 0.0,
|
||
|
((0, 1), 'west'): 0,
|
||
|
((0, 2), 'exit'): -1.0}
|
||
|
"""
|
||
|
|
||
|
q_values_k_5_action_north: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_5_action_east: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_5_action_exit: """
|
||
|
-1.0000
|
||
|
illegal
|
||
|
2.7100
|
||
|
"""
|
||
|
|
||
|
q_values_k_5_action_south: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_5_action_west: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
weights_k_6: """
|
||
|
{((0, 0), 'exit'): 3.439,
|
||
|
((0, 1), 'east'): 0,
|
||
|
((0, 1), 'north'): 0,
|
||
|
((0, 1), 'south'): 0.0,
|
||
|
((0, 1), 'west'): 0,
|
||
|
((0, 2), 'exit'): -1.0}
|
||
|
"""
|
||
|
|
||
|
q_values_k_6_action_north: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_6_action_east: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_6_action_exit: """
|
||
|
-1.0000
|
||
|
illegal
|
||
|
3.4390
|
||
|
"""
|
||
|
|
||
|
q_values_k_6_action_south: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_6_action_west: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
weights_k_7: """
|
||
|
{((0, 0), 'exit'): 3.439,
|
||
|
((0, 1), 'east'): 0,
|
||
|
((0, 1), 'north'): 0,
|
||
|
((0, 1), 'south'): 0.17195000000000002,
|
||
|
((0, 1), 'west'): 0,
|
||
|
((0, 2), 'exit'): -1.0}
|
||
|
"""
|
||
|
|
||
|
q_values_k_7_action_north: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_7_action_east: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_7_action_exit: """
|
||
|
-1.0000
|
||
|
illegal
|
||
|
3.4390
|
||
|
"""
|
||
|
|
||
|
q_values_k_7_action_south: """
|
||
|
illegal
|
||
|
0.1720
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_7_action_west: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
weights_k_8: """
|
||
|
{((0, 0), 'exit'): 4.0951,
|
||
|
((0, 1), 'east'): 0,
|
||
|
((0, 1), 'north'): 0,
|
||
|
((0, 1), 'south'): 0.17195000000000002,
|
||
|
((0, 1), 'west'): 0,
|
||
|
((0, 2), 'exit'): -1.0}
|
||
|
"""
|
||
|
|
||
|
q_values_k_8_action_north: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_8_action_east: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_8_action_exit: """
|
||
|
-1.0000
|
||
|
illegal
|
||
|
4.0951
|
||
|
"""
|
||
|
|
||
|
q_values_k_8_action_south: """
|
||
|
illegal
|
||
|
0.1720
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_8_action_west: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
weights_k_9: """
|
||
|
{((0, 0), 'exit'): 4.68559,
|
||
|
((0, 1), 'east'): 0,
|
||
|
((0, 1), 'north'): 0,
|
||
|
((0, 1), 'south'): 0.17195000000000002,
|
||
|
((0, 1), 'west'): 0,
|
||
|
((0, 2), 'exit'): -1.0}
|
||
|
"""
|
||
|
|
||
|
q_values_k_9_action_north: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_9_action_east: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_9_action_exit: """
|
||
|
-1.0000
|
||
|
illegal
|
||
|
4.6856
|
||
|
"""
|
||
|
|
||
|
q_values_k_9_action_south: """
|
||
|
illegal
|
||
|
0.1720
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_9_action_west: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
weights_k_100: """
|
||
|
{((0, 0), 'exit'): 9.817519963685992,
|
||
|
((0, 1), 'east'): 0.40629236674335106,
|
||
|
((0, 1), 'north'): -0.4534185789984799,
|
||
|
((0, 1), 'south'): 2.126721095524319,
|
||
|
((0, 1), 'west'): 0.39193283364906867,
|
||
|
((0, 2), 'exit'): -9.476652366972639}
|
||
|
"""
|
||
|
|
||
|
q_values_k_100_action_north: """
|
||
|
illegal
|
||
|
-0.4534
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_100_action_east: """
|
||
|
illegal
|
||
|
0.4063
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_100_action_exit: """
|
||
|
-9.4767
|
||
|
illegal
|
||
|
9.8175
|
||
|
"""
|
||
|
|
||
|
q_values_k_100_action_south: """
|
||
|
illegal
|
||
|
2.1267
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_100_action_west: """
|
||
|
illegal
|
||
|
0.3919
|
||
|
illegal
|
||
|
"""
|
||
|
|