457 lines
22 KiB
Plaintext
457 lines
22 KiB
Plaintext
q_values_k_0_action_north: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_0_action_east: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_0_action_exit: """
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ illegal illegal
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ __________ illegal
|
|
0.0000 illegal illegal illegal illegal
|
|
"""
|
|
|
|
q_values_k_0_action_south: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_0_action_west: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_1_action_north: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_1_action_east: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_1_action_exit: """
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ illegal illegal
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ __________ illegal
|
|
0.0000 illegal illegal illegal illegal
|
|
"""
|
|
|
|
q_values_k_1_action_south: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_1_action_west: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_2_action_north: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_2_action_east: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_2_action_exit: """
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ illegal illegal
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ __________ illegal
|
|
0.0000 illegal illegal illegal illegal
|
|
"""
|
|
|
|
q_values_k_2_action_south: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_2_action_west: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_3_action_north: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_3_action_east: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_3_action_exit: """
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ illegal illegal
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ __________ illegal
|
|
-1.0000 illegal illegal illegal illegal
|
|
"""
|
|
|
|
q_values_k_3_action_south: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_3_action_west: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_4_action_north: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_4_action_east: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_4_action_exit: """
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ illegal illegal
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ __________ illegal
|
|
-1.0000 illegal illegal illegal illegal
|
|
"""
|
|
|
|
q_values_k_4_action_south: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_4_action_west: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_5_action_north: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_5_action_east: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_5_action_exit: """
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ illegal illegal
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ __________ illegal
|
|
-1.0000 illegal illegal illegal illegal
|
|
"""
|
|
|
|
q_values_k_5_action_south: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_5_action_west: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_6_action_north: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_6_action_east: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_6_action_exit: """
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
-1.0000 illegal __________ illegal illegal
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
0.0000 illegal __________ __________ illegal
|
|
-1.0000 illegal illegal illegal illegal
|
|
"""
|
|
|
|
q_values_k_6_action_south: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_6_action_west: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_7_action_north: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_7_action_east: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_7_action_exit: """
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
-1.0000 illegal __________ illegal illegal
|
|
0.0000 illegal 0.1000 illegal illegal
|
|
0.0000 illegal __________ __________ illegal
|
|
-1.0000 illegal illegal illegal illegal
|
|
"""
|
|
|
|
q_values_k_7_action_south: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_7_action_west: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_8_action_north: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_8_action_east: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_8_action_exit: """
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
-1.0000 illegal __________ illegal illegal
|
|
0.0000 illegal 0.1000 illegal illegal
|
|
-1.0000 illegal __________ __________ illegal
|
|
-1.0000 illegal illegal illegal illegal
|
|
"""
|
|
|
|
q_values_k_8_action_south: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_8_action_west: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_9_action_north: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal -0.0900 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_9_action_east: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_9_action_exit: """
|
|
0.0000 illegal 0.0000 illegal illegal
|
|
-1.0000 illegal __________ illegal illegal
|
|
0.0000 illegal 0.1000 illegal illegal
|
|
-1.0000 illegal __________ __________ illegal
|
|
-1.0000 illegal illegal illegal illegal
|
|
"""
|
|
|
|
q_values_k_9_action_south: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_9_action_west: """
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ 0.0000 0.0000
|
|
illegal 0.0000 illegal 0.0000 0.0000
|
|
illegal 0.0000 __________ __________ 0.0000
|
|
illegal 0.0000 0.0000 0.0000 0.0000
|
|
"""
|
|
|
|
q_values_k_3000_action_north: """
|
|
illegal 4.3205 illegal 6.1517 3.8095
|
|
illegal 4.4238 __________ 5.2284 3.5129
|
|
illegal 1.0694 illegal 3.6867 2.0418
|
|
illegal 0.3423 __________ __________ 1.0655
|
|
illegal 0.0073 0.0079 0.0484 0.3768
|
|
"""
|
|
|
|
q_values_k_3000_action_east: """
|
|
illegal 8.0584 illegal 3.7245 3.3947
|
|
illegal 2.0499 __________ 3.2373 2.1742
|
|
illegal 0.8687 illegal 1.7398 1.2671
|
|
illegal 0.2927 __________ __________ 0.6669
|
|
illegal 0.0239 0.0097 0.1611 0.2051
|
|
"""
|
|
|
|
q_values_k_3000_action_exit: """
|
|
-10.0000 illegal 10.0000 illegal illegal
|
|
-10.0000 illegal __________ illegal illegal
|
|
-10.0000 illegal 1.0000 illegal illegal
|
|
-10.0000 illegal __________ __________ illegal
|
|
-9.9999 illegal illegal illegal illegal
|
|
"""
|
|
|
|
q_values_k_3000_action_south: """
|
|
illegal -0.3521 illegal 3.6948 2.9139
|
|
illegal -0.5605 __________ 2.1346 1.5674
|
|
illegal 0.2093 illegal 1.5389 0.5521
|
|
illegal -0.5505 __________ __________ 0.1006
|
|
illegal -1.8501 0.0060 0.0514 0.1223
|
|
"""
|
|
|
|
q_values_k_3000_action_west: """
|
|
illegal -6.2001 illegal 7.5146 4.9014
|
|
illegal -5.4013 __________ 4.0484 3.4126
|
|
illegal -8.0399 illegal 0.9653 1.6081
|
|
illegal -7.4767 __________ __________ 0.3934
|
|
illegal -6.3432 0.0179 0.0188 0.1028
|
|
"""
|
|
|
|
values: """
|
|
-10.0000 8.0584 10.0000 7.5146 4.9014
|
|
-10.0000 4.4238 __________ 5.2284 3.5129
|
|
-10.0000 1.0694 1.0000 3.6867 2.0418
|
|
-10.0000 0.3423 __________ __________ 1.0655
|
|
-9.9999 0.0239 0.0179 0.1611 0.3768
|
|
"""
|
|
|
|
policy: """
|
|
exit east exit west west
|
|
exit north __________ north north
|
|
exit north exit north north
|
|
exit north __________ __________ north
|
|
exit east west east north
|
|
"""
|
|
|