411 lines
5.9 KiB
Plaintext
411 lines
5.9 KiB
Plaintext
|
values_k_0: """
|
||
|
0.0000
|
||
|
0.0000
|
||
|
0.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_0_action_north: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_0_action_east: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_0_action_exit: """
|
||
|
-10.0000
|
||
|
illegal
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_0_action_south: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_0_action_west: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
values_k_1: """
|
||
|
-10.0000
|
||
|
0.0000
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_1_action_north: """
|
||
|
illegal
|
||
|
-5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_1_action_east: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_1_action_exit: """
|
||
|
-10.0000
|
||
|
illegal
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_1_action_south: """
|
||
|
illegal
|
||
|
5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_1_action_west: """
|
||
|
illegal
|
||
|
0.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
values_k_2: """
|
||
|
-10.0000
|
||
|
5.0000
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_2_action_north: """
|
||
|
illegal
|
||
|
-5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_2_action_east: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_2_action_exit: """
|
||
|
-10.0000
|
||
|
illegal
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_2_action_south: """
|
||
|
illegal
|
||
|
5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_2_action_west: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
values_k_3: """
|
||
|
-10.0000
|
||
|
5.0000
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_3_action_north: """
|
||
|
illegal
|
||
|
-5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_3_action_east: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_3_action_exit: """
|
||
|
-10.0000
|
||
|
illegal
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_3_action_south: """
|
||
|
illegal
|
||
|
5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_3_action_west: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
values_k_4: """
|
||
|
-10.0000
|
||
|
5.0000
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_4_action_north: """
|
||
|
illegal
|
||
|
-5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_4_action_east: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_4_action_exit: """
|
||
|
-10.0000
|
||
|
illegal
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_4_action_south: """
|
||
|
illegal
|
||
|
5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_4_action_west: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
values_k_5: """
|
||
|
-10.0000
|
||
|
5.0000
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_5_action_north: """
|
||
|
illegal
|
||
|
-5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_5_action_east: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_5_action_exit: """
|
||
|
-10.0000
|
||
|
illegal
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_5_action_south: """
|
||
|
illegal
|
||
|
5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_5_action_west: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
values_k_6: """
|
||
|
-10.0000
|
||
|
5.0000
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_6_action_north: """
|
||
|
illegal
|
||
|
-5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_6_action_east: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_6_action_exit: """
|
||
|
-10.0000
|
||
|
illegal
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_6_action_south: """
|
||
|
illegal
|
||
|
5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_6_action_west: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
values_k_7: """
|
||
|
-10.0000
|
||
|
5.0000
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_7_action_north: """
|
||
|
illegal
|
||
|
-5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_7_action_east: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_7_action_exit: """
|
||
|
-10.0000
|
||
|
illegal
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_7_action_south: """
|
||
|
illegal
|
||
|
5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_7_action_west: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
values_k_8: """
|
||
|
-10.0000
|
||
|
5.0000
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_8_action_north: """
|
||
|
illegal
|
||
|
-5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_8_action_east: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_8_action_exit: """
|
||
|
-10.0000
|
||
|
illegal
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_8_action_south: """
|
||
|
illegal
|
||
|
5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_8_action_west: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
values_k_9: """
|
||
|
-10.0000
|
||
|
5.0000
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_9_action_north: """
|
||
|
illegal
|
||
|
-5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_9_action_east: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_9_action_exit: """
|
||
|
-10.0000
|
||
|
illegal
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_9_action_south: """
|
||
|
illegal
|
||
|
5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_9_action_west: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
values_k_100: """
|
||
|
-10.0000
|
||
|
5.0000
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_100_action_north: """
|
||
|
illegal
|
||
|
-5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_100_action_east: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_100_action_exit: """
|
||
|
-10.0000
|
||
|
illegal
|
||
|
10.0000
|
||
|
"""
|
||
|
|
||
|
q_values_k_100_action_south: """
|
||
|
illegal
|
||
|
5.0000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
q_values_k_100_action_west: """
|
||
|
illegal
|
||
|
2.5000
|
||
|
illegal
|
||
|
"""
|
||
|
|
||
|
policy: """
|
||
|
exit
|
||
|
south
|
||
|
exit
|
||
|
"""
|
||
|
|
||
|
actions: """
|
||
|
north
|
||
|
east
|
||
|
exit
|
||
|
south
|
||
|
west
|
||
|
"""
|
||
|
|