intro2ai/p3_rl/test_cases/q4/2-tinygrid-noisy.solution

343 lines
5.1 KiB
Plaintext
Raw Normal View History

2021-11-27 16:16:51 +01:00
q_values_k_0_action_north: """
illegal
0.0000
illegal
"""
q_values_k_0_action_east: """
illegal
0.0000
illegal
"""
q_values_k_0_action_exit: """
0.0000
illegal
0.0000
"""
q_values_k_0_action_south: """
illegal
0.0000
illegal
"""
q_values_k_0_action_west: """
illegal
0.0000
illegal
"""
q_values_k_1_action_north: """
illegal
0.0000
illegal
"""
q_values_k_1_action_east: """
illegal
0.0000
illegal
"""
q_values_k_1_action_exit: """
0.0000
illegal
1.0000
"""
q_values_k_1_action_south: """
illegal
0.0000
illegal
"""
q_values_k_1_action_west: """
illegal
0.0000
illegal
"""
q_values_k_2_action_north: """
illegal
0.0000
illegal
"""
q_values_k_2_action_east: """
illegal
0.0000
illegal
"""
q_values_k_2_action_exit: """
0.0000
illegal
1.0000
"""
q_values_k_2_action_south: """
illegal
0.0000
illegal
"""
q_values_k_2_action_west: """
illegal
0.0000
illegal
"""
q_values_k_3_action_north: """
illegal
0.0000
illegal
"""
q_values_k_3_action_east: """
illegal
0.0000
illegal
"""
q_values_k_3_action_exit: """
0.0000
illegal
1.9000
"""
q_values_k_3_action_south: """
illegal
0.0000
illegal
"""
q_values_k_3_action_west: """
illegal
0.0000
illegal
"""
q_values_k_4_action_north: """
illegal
0.0000
illegal
"""
q_values_k_4_action_east: """
illegal
0.0000
illegal
"""
q_values_k_4_action_exit: """
0.0000
illegal
2.7100
"""
q_values_k_4_action_south: """
illegal
0.0000
illegal
"""
q_values_k_4_action_west: """
illegal
0.0000
illegal
"""
q_values_k_5_action_north: """
illegal
0.0000
illegal
"""
q_values_k_5_action_east: """
illegal
0.0000
illegal
"""
q_values_k_5_action_exit: """
-1.0000
illegal
2.7100
"""
q_values_k_5_action_south: """
illegal
0.0000
illegal
"""
q_values_k_5_action_west: """
illegal
0.0000
illegal
"""
q_values_k_6_action_north: """
illegal
0.0000
illegal
"""
q_values_k_6_action_east: """
illegal
0.0000
illegal
"""
q_values_k_6_action_exit: """
-1.0000
illegal
3.4390
"""
q_values_k_6_action_south: """
illegal
0.0000
illegal
"""
q_values_k_6_action_west: """
illegal
0.0000
illegal
"""
q_values_k_7_action_north: """
illegal
0.0000
illegal
"""
q_values_k_7_action_east: """
illegal
0.0000
illegal
"""
q_values_k_7_action_exit: """
-1.0000
illegal
3.4390
"""
q_values_k_7_action_south: """
illegal
0.2579
illegal
"""
q_values_k_7_action_west: """
illegal
0.0000
illegal
"""
q_values_k_8_action_north: """
illegal
0.0000
illegal
"""
q_values_k_8_action_east: """
illegal
0.0000
illegal
"""
q_values_k_8_action_exit: """
-1.0000
illegal
4.0951
"""
q_values_k_8_action_south: """
illegal
0.2579
illegal
"""
q_values_k_8_action_west: """
illegal
0.0000
illegal
"""
q_values_k_9_action_north: """
illegal
0.0000
illegal
"""
q_values_k_9_action_east: """
illegal
0.0000
illegal
"""
q_values_k_9_action_exit: """
-1.0000
illegal
4.6856
"""
q_values_k_9_action_south: """
illegal
0.2579
illegal
"""
q_values_k_9_action_west: """
illegal
0.0000
illegal
"""
q_values_k_100_action_north: """
illegal
-0.6670
illegal
"""
q_values_k_100_action_east: """
illegal
0.9499
illegal
"""
q_values_k_100_action_exit: """
-9.4767
illegal
9.8175
"""
q_values_k_100_action_south: """
illegal
3.2562
illegal
"""
q_values_k_100_action_west: """
illegal
0.8236
illegal
"""
values: """
-9.4767
3.2562
9.8175
"""
policy: """
exit
south
exit
"""