343 lines
5.1 KiB
Plaintext
343 lines
5.1 KiB
Plaintext
q_values_k_0_action_north: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_0_action_east: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_0_action_exit: """
|
|
0.0000
|
|
illegal
|
|
0.0000
|
|
"""
|
|
|
|
q_values_k_0_action_south: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_0_action_west: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_1_action_north: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_1_action_east: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_1_action_exit: """
|
|
0.0000
|
|
illegal
|
|
1.0000
|
|
"""
|
|
|
|
q_values_k_1_action_south: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_1_action_west: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_2_action_north: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_2_action_east: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_2_action_exit: """
|
|
0.0000
|
|
illegal
|
|
1.0000
|
|
"""
|
|
|
|
q_values_k_2_action_south: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_2_action_west: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_3_action_north: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_3_action_east: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_3_action_exit: """
|
|
0.0000
|
|
illegal
|
|
1.9000
|
|
"""
|
|
|
|
q_values_k_3_action_south: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_3_action_west: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_4_action_north: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_4_action_east: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_4_action_exit: """
|
|
0.0000
|
|
illegal
|
|
2.7100
|
|
"""
|
|
|
|
q_values_k_4_action_south: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_4_action_west: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_5_action_north: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_5_action_east: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_5_action_exit: """
|
|
-1.0000
|
|
illegal
|
|
2.7100
|
|
"""
|
|
|
|
q_values_k_5_action_south: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_5_action_west: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_6_action_north: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_6_action_east: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_6_action_exit: """
|
|
-1.0000
|
|
illegal
|
|
3.4390
|
|
"""
|
|
|
|
q_values_k_6_action_south: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_6_action_west: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_7_action_north: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_7_action_east: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_7_action_exit: """
|
|
-1.0000
|
|
illegal
|
|
3.4390
|
|
"""
|
|
|
|
q_values_k_7_action_south: """
|
|
illegal
|
|
0.2579
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_7_action_west: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_8_action_north: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_8_action_east: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_8_action_exit: """
|
|
-1.0000
|
|
illegal
|
|
4.0951
|
|
"""
|
|
|
|
q_values_k_8_action_south: """
|
|
illegal
|
|
0.2579
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_8_action_west: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_9_action_north: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_9_action_east: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_9_action_exit: """
|
|
-1.0000
|
|
illegal
|
|
4.6856
|
|
"""
|
|
|
|
q_values_k_9_action_south: """
|
|
illegal
|
|
0.2579
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_9_action_west: """
|
|
illegal
|
|
0.0000
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_100_action_north: """
|
|
illegal
|
|
-0.6670
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_100_action_east: """
|
|
illegal
|
|
0.9499
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_100_action_exit: """
|
|
-9.4767
|
|
illegal
|
|
9.8175
|
|
"""
|
|
|
|
q_values_k_100_action_south: """
|
|
illegal
|
|
3.2562
|
|
illegal
|
|
"""
|
|
|
|
q_values_k_100_action_west: """
|
|
illegal
|
|
0.8236
|
|
illegal
|
|
"""
|
|
|
|
values: """
|
|
-9.4767
|
|
3.2562
|
|
9.8175
|
|
"""
|
|
|
|
policy: """
|
|
exit
|
|
south
|
|
exit
|
|
"""
|
|
|