Answer project 3 question 3.

This commit is contained in:
2021-12-01 19:14:32 -05:00
parent d1a4735c5a
commit 8ba1f91f9b

View File

@@ -20,44 +20,45 @@
# value iteration. # value iteration.
def question2(): def question2():
"""
Changing the discount value doesn't change the behavior of the agent because
falling down causes too high a penalty. Changing the noise to only one percent
failure (noise=0.01) makes it safe enough to cross the bridge even with a 0.8
discount factor.
"""
answerDiscount = 0.9 answerDiscount = 0.9
answerNoise = 0.2 answerNoise = 0.01
return answerDiscount, answerNoise return answerDiscount, answerNoise
def question3a(): def question3a():
answerDiscount = None answerDiscount = 0.2
answerNoise = None answerNoise = 0
answerLivingReward = None answerLivingReward = 0
return answerDiscount, answerNoise, answerLivingReward return answerDiscount, answerNoise, answerLivingReward
# If not possible, return 'NOT POSSIBLE'
def question3b(): def question3b():
answerDiscount = None answerDiscount = 0.31622776601683794
answerNoise = None answerNoise = 0.2
answerLivingReward = None answerLivingReward = 0
return answerDiscount, answerNoise, answerLivingReward return answerDiscount, answerNoise, answerLivingReward
# If not possible, return 'NOT POSSIBLE'
def question3c(): def question3c():
answerDiscount = None answerDiscount = 0.9
answerNoise = None answerNoise = 0
answerLivingReward = None answerLivingReward = 0
return answerDiscount, answerNoise, answerLivingReward return answerDiscount, answerNoise, answerLivingReward
# If not possible, return 'NOT POSSIBLE'
def question3d(): def question3d():
answerDiscount = None answerDiscount = 0.9
answerNoise = None answerNoise = 0.2
answerLivingReward = None answerLivingReward = 0
return answerDiscount, answerNoise, answerLivingReward return answerDiscount, answerNoise, answerLivingReward
# If not possible, return 'NOT POSSIBLE'
def question3e(): def question3e():
answerDiscount = None answerDiscount = 0
answerNoise = None answerNoise = 0
answerLivingReward = None answerLivingReward = 1
return answerDiscount, answerNoise, answerLivingReward return answerDiscount, answerNoise, answerLivingReward
# If not possible, return 'NOT POSSIBLE'
def question6(): def question6():
answerEpsilon = None answerEpsilon = None