intro2ai/p3_rl/test_cases/q1/3-bridge.solution

679 lines
23 KiB
Plaintext

values_k_0: """
__________ 0.0000 __________
0.0000 0.0000 0.0000
0.0000 0.0000 0.0000
0.0000 0.0000 0.0000
0.0000 0.0000 0.0000
0.0000 0.0000 0.0000
__________ 0.0000 __________
"""
q_values_k_0_action_north: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_0_action_east: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_0_action_exit: """
__________ 10.0000 __________
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
__________ 1.0000 __________
"""
q_values_k_0_action_south: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
q_values_k_0_action_west: """
__________ illegal __________
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
illegal 0.0000 illegal
__________ illegal __________
"""
values_k_1: """
__________ 10.0000 __________
-100.0000 0.0000 -100.0000
-100.0000 0.0000 -100.0000
-100.0000 0.0000 -100.0000
-100.0000 0.0000 -100.0000
-100.0000 0.0000 -100.0000
__________ 1.0000 __________
"""
q_values_k_1_action_north: """
__________ illegal __________
illegal -0.8500 illegal
illegal -8.5000 illegal
illegal -8.5000 illegal
illegal -8.5000 illegal
illegal -8.5000 illegal
__________ illegal __________
"""
q_values_k_1_action_east: """
__________ illegal __________
illegal -76.0750 illegal
illegal -76.5000 illegal
illegal -76.5000 illegal
illegal -76.5000 illegal
illegal -76.4575 illegal
__________ illegal __________
"""
q_values_k_1_action_exit: """
__________ 10.0000 __________
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
__________ 1.0000 __________
"""
q_values_k_1_action_south: """
__________ illegal __________
illegal -8.5000 illegal
illegal -8.5000 illegal
illegal -8.5000 illegal
illegal -8.5000 illegal
illegal -7.7350 illegal
__________ illegal __________
"""
q_values_k_1_action_west: """
__________ illegal __________
illegal -76.0750 illegal
illegal -76.5000 illegal
illegal -76.5000 illegal
illegal -76.5000 illegal
illegal -76.4575 illegal
__________ illegal __________
"""
values_k_2: """
__________ 10.0000 __________
-100.0000 -0.8500 -100.0000
-100.0000 -8.5000 -100.0000
-100.0000 -8.5000 -100.0000
-100.0000 -8.5000 -100.0000
-100.0000 -7.7350 -100.0000
__________ 1.0000 __________
"""
q_values_k_2_action_north: """
__________ illegal __________
illegal -0.8500 illegal
illegal -9.1502 illegal
illegal -15.0025 illegal
illegal -15.0025 illegal
illegal -15.0025 illegal
__________ illegal __________
"""
q_values_k_2_action_east: """
__________ illegal __________
illegal -76.4363 illegal
illegal -76.8974 illegal
illegal -77.2225 illegal
illegal -77.1900 illegal
illegal -76.8187 illegal
__________ illegal __________
"""
q_values_k_2_action_exit: """
__________ 10.0000 __________
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
__________ 1.0000 __________
"""
q_values_k_2_action_south: """
__________ illegal __________
illegal -15.0025 illegal
illegal -15.0025 illegal
illegal -15.0025 illegal
illegal -14.4173 illegal
illegal -7.7350 illegal
__________ illegal __________
"""
q_values_k_2_action_west: """
__________ illegal __________
illegal -76.4363 illegal
illegal -76.8974 illegal
illegal -77.2225 illegal
illegal -77.1900 illegal
illegal -76.8187 illegal
__________ illegal __________
"""
values_k_3: """
__________ 10.0000 __________
-100.0000 -0.8500 -100.0000
-100.0000 -9.1502 -100.0000
-100.0000 -15.0025 -100.0000
-100.0000 -14.4173 -100.0000
-100.0000 -7.7350 -100.0000
__________ 1.0000 __________
"""
q_values_k_3_action_north: """
__________ illegal __________
illegal -0.8500 illegal
illegal -9.1502 illegal
illegal -15.4999 illegal
illegal -19.9769 illegal
illegal -19.5292 illegal
__________ illegal __________
"""
q_values_k_3_action_east: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1737 illegal
illegal -77.5016 illegal
illegal -77.4663 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
q_values_k_3_action_exit: """
__________ 10.0000 __________
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
__________ 1.0000 __________
"""
q_values_k_3_action_south: """
__________ illegal __________
illegal -15.4999 illegal
illegal -19.9769 illegal
illegal -19.5292 illegal
illegal -14.4173 illegal
illegal -7.7350 illegal
__________ illegal __________
"""
q_values_k_3_action_west: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1737 illegal
illegal -77.5016 illegal
illegal -77.4663 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
values_k_4: """
__________ 10.0000 __________
-100.0000 -0.8500 -100.0000
-100.0000 -9.1502 -100.0000
-100.0000 -15.4999 -100.0000
-100.0000 -14.4173 -100.0000
-100.0000 -7.7350 -100.0000
__________ 1.0000 __________
"""
q_values_k_4_action_north: """
__________ illegal __________
illegal -0.8500 illegal
illegal -9.1502 illegal
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
__________ illegal __________
"""
q_values_k_4_action_east: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
q_values_k_4_action_exit: """
__________ 10.0000 __________
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
__________ 1.0000 __________
"""
q_values_k_4_action_south: """
__________ illegal __________
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
illegal -14.4173 illegal
illegal -7.7350 illegal
__________ illegal __________
"""
q_values_k_4_action_west: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
values_k_5: """
__________ 10.0000 __________
-100.0000 -0.8500 -100.0000
-100.0000 -9.1502 -100.0000
-100.0000 -15.4999 -100.0000
-100.0000 -14.4173 -100.0000
-100.0000 -7.7350 -100.0000
__________ 1.0000 __________
"""
q_values_k_5_action_north: """
__________ illegal __________
illegal -0.8500 illegal
illegal -9.1502 illegal
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
__________ illegal __________
"""
q_values_k_5_action_east: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
q_values_k_5_action_exit: """
__________ 10.0000 __________
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
__________ 1.0000 __________
"""
q_values_k_5_action_south: """
__________ illegal __________
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
illegal -14.4173 illegal
illegal -7.7350 illegal
__________ illegal __________
"""
q_values_k_5_action_west: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
values_k_6: """
__________ 10.0000 __________
-100.0000 -0.8500 -100.0000
-100.0000 -9.1502 -100.0000
-100.0000 -15.4999 -100.0000
-100.0000 -14.4173 -100.0000
-100.0000 -7.7350 -100.0000
__________ 1.0000 __________
"""
q_values_k_6_action_north: """
__________ illegal __________
illegal -0.8500 illegal
illegal -9.1502 illegal
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
__________ illegal __________
"""
q_values_k_6_action_east: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
q_values_k_6_action_exit: """
__________ 10.0000 __________
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
__________ 1.0000 __________
"""
q_values_k_6_action_south: """
__________ illegal __________
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
illegal -14.4173 illegal
illegal -7.7350 illegal
__________ illegal __________
"""
q_values_k_6_action_west: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
values_k_7: """
__________ 10.0000 __________
-100.0000 -0.8500 -100.0000
-100.0000 -9.1502 -100.0000
-100.0000 -15.4999 -100.0000
-100.0000 -14.4173 -100.0000
-100.0000 -7.7350 -100.0000
__________ 1.0000 __________
"""
q_values_k_7_action_north: """
__________ illegal __________
illegal -0.8500 illegal
illegal -9.1502 illegal
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
__________ illegal __________
"""
q_values_k_7_action_east: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
q_values_k_7_action_exit: """
__________ 10.0000 __________
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
__________ 1.0000 __________
"""
q_values_k_7_action_south: """
__________ illegal __________
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
illegal -14.4173 illegal
illegal -7.7350 illegal
__________ illegal __________
"""
q_values_k_7_action_west: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
values_k_8: """
__________ 10.0000 __________
-100.0000 -0.8500 -100.0000
-100.0000 -9.1502 -100.0000
-100.0000 -15.4999 -100.0000
-100.0000 -14.4173 -100.0000
-100.0000 -7.7350 -100.0000
__________ 1.0000 __________
"""
q_values_k_8_action_north: """
__________ illegal __________
illegal -0.8500 illegal
illegal -9.1502 illegal
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
__________ illegal __________
"""
q_values_k_8_action_east: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
q_values_k_8_action_exit: """
__________ 10.0000 __________
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
__________ 1.0000 __________
"""
q_values_k_8_action_south: """
__________ illegal __________
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
illegal -14.4173 illegal
illegal -7.7350 illegal
__________ illegal __________
"""
q_values_k_8_action_west: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
values_k_9: """
__________ 10.0000 __________
-100.0000 -0.8500 -100.0000
-100.0000 -9.1502 -100.0000
-100.0000 -15.4999 -100.0000
-100.0000 -14.4173 -100.0000
-100.0000 -7.7350 -100.0000
__________ 1.0000 __________
"""
q_values_k_9_action_north: """
__________ illegal __________
illegal -0.8500 illegal
illegal -9.1502 illegal
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
__________ illegal __________
"""
q_values_k_9_action_east: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
q_values_k_9_action_exit: """
__________ 10.0000 __________
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
__________ 1.0000 __________
"""
q_values_k_9_action_south: """
__________ illegal __________
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
illegal -14.4173 illegal
illegal -7.7350 illegal
__________ illegal __________
"""
q_values_k_9_action_west: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
values_k_100: """
__________ 10.0000 __________
-100.0000 -0.8500 -100.0000
-100.0000 -9.1502 -100.0000
-100.0000 -15.4999 -100.0000
-100.0000 -14.4173 -100.0000
-100.0000 -7.7350 -100.0000
__________ 1.0000 __________
"""
q_values_k_100_action_north: """
__________ illegal __________
illegal -0.8500 illegal
illegal -9.1502 illegal
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
__________ illegal __________
"""
q_values_k_100_action_east: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
q_values_k_100_action_exit: """
__________ 10.0000 __________
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
-100.0000 illegal -100.0000
__________ 1.0000 __________
"""
q_values_k_100_action_south: """
__________ illegal __________
illegal -15.4999 illegal
illegal -20.3575 illegal
illegal -19.5292 illegal
illegal -14.4173 illegal
illegal -7.7350 illegal
__________ illegal __________
"""
q_values_k_100_action_west: """
__________ illegal __________
illegal -76.4639 illegal
illegal -77.1949 illegal
illegal -77.5016 illegal
illegal -77.4875 illegal
illegal -77.0702 illegal
__________ illegal __________
"""
policy: """
__________ exit __________
exit north exit
exit north exit
exit north exit
exit south exit
exit south exit
__________ exit __________
"""
actions: """
north
east
exit
south
west
"""