intro2ai/p3_rl/test_cases/q5/4-discountgrid.test

25 lines
463 B
Plaintext
Raw Normal View History

2021-11-27 16:16:51 +01:00
class: "EpsilonGreedyTest"
# GridWorld specification
# Each line of the grid below is one row; cells are separated by whitespace.
# _ is an empty space
# a number is a terminal state with that value
# # is a wall
# S is the start state
#
grid: """
-10 _ 10 _ _
-10 _ # _ _
-10 _ 1 _ _
-10 _ # # _
-10 S _ _ _
"""
discount: "0.9"
noise: "0.2"
livingReward: "0.0"
epsilon: "0.2"
learningRate: "0.1"
numExperiences: "3000"
valueIterations: "100"
iterations: "10000"