Add project 3 RL template.

This commit is contained in:
2021-11-27 10:16:51 -05:00
parent a4031888de
commit 524362c5c5
100 changed files with 16641 additions and 0 deletions

View File

@@ -0,0 +1,2 @@
# This is the solution file for test_cases/q5/1-tinygrid.test.
# File intentionally blank.

View File

@@ -0,0 +1,22 @@
class: "EpsilonGreedyTest"
# GridWorld specification
# '_' is empty space
# numbers are terminal states with that value
# '#' is a wall
# 'S' is a start state
#
grid: """
-10
S
10
"""
discount: "0.5"
noise: "0.0"
livingReward: "0.0"
epsilon: "0.5"
learningRate: "0.1"
numExperiences: "100"
valueIterations: "100"
iterations: "10000"

View File

@@ -0,0 +1,2 @@
# This is the solution file for test_cases/q5/2-tinygrid-noisy.test.
# File intentionally blank.

View File

@@ -0,0 +1,22 @@
class: "EpsilonGreedyTest"
# GridWorld specification
# '_' is empty space
# numbers are terminal states with that value
# '#' is a wall
# 'S' is a start state
#
grid: """
-10
S
10
"""
discount: "0.75"
noise: "0.25"
livingReward: "0.0"
epsilon: "0.5"
learningRate: "0.1"
numExperiences: "100"
valueIterations: "100"
iterations: "10000"

View File

@@ -0,0 +1,2 @@
# This is the solution file for test_cases/q5/3-bridge.test.
# File intentionally blank.

View File

@@ -0,0 +1,27 @@
class: "EpsilonGreedyTest"
# GridWorld specification
# '_' is empty space
# numbers are terminal states with that value
# '#' is a wall
# 'S' is a start state
#
grid: """
# 10 #
-100 _ -100
-100 _ -100
-100 _ -100
-100 _ -100
-100 S -100
# 1 #
"""
gridName: "bridgeGrid"
discount: "0.85"
noise: "0.1"
livingReward: "0.0"
epsilon: "0.5"
learningRate: "0.1"
numExperiences: "500"
valueIterations: "100"
iterations: "10000"

View File

@@ -0,0 +1,2 @@
# This is the solution file for test_cases/q5/4-discountgrid.test.
# File intentionally blank.

View File

@@ -0,0 +1,24 @@
class: "EpsilonGreedyTest"
# GridWorld specification
# '_' is empty space
# numbers are terminal states with that value
# '#' is a wall
# 'S' is a start state
#
grid: """
-10 _ 10 _ _
-10 _ # _ _
-10 _ 1 _ _
-10 _ # # _
-10 S _ _ _
"""
discount: "0.9"
noise: "0.2"
livingReward: "0.0"
epsilon: "0.2"
learningRate: "0.1"
numExperiences: "3000"
valueIterations: "100"
iterations: "10000"

View File

@@ -0,0 +1,2 @@
max_points: "3"
class: "PassAllTestsQuestion"