enter reinforcement
This commit is contained in:
2
reinforcement/test_cases/q4/1-tinygrid.solution
Normal file
2
reinforcement/test_cases/q4/1-tinygrid.solution
Normal file
@ -0,0 +1,2 @@
|
||||
# This is the solution file for test_cases/q4/1-tinygrid.test.
|
||||
# File intentionally blank.
|
22
reinforcement/test_cases/q4/1-tinygrid.test
Normal file
22
reinforcement/test_cases/q4/1-tinygrid.test
Normal file
@ -0,0 +1,22 @@
|
||||
class: "EpsilonGreedyTest"
|
||||
|
||||
# GridWorld specification
|
||||
# _ is empty space
|
||||
# numbers are terminal states with that value
|
||||
# # is a wall
|
||||
# S is a start state
|
||||
#
|
||||
grid: """
|
||||
-10
|
||||
S
|
||||
10
|
||||
"""
|
||||
discount: "0.5"
|
||||
noise: "0.0"
|
||||
livingReward: "0.0"
|
||||
epsilon: "0.5"
|
||||
learningRate: "0.1"
|
||||
numExperiences: "100"
|
||||
valueIterations: "100"
|
||||
iterations: "10000"
|
||||
|
2
reinforcement/test_cases/q4/2-tinygrid-noisy.solution
Normal file
2
reinforcement/test_cases/q4/2-tinygrid-noisy.solution
Normal file
@ -0,0 +1,2 @@
|
||||
# This is the solution file for test_cases/q4/2-tinygrid-noisy.test.
|
||||
# File intentionally blank.
|
22
reinforcement/test_cases/q4/2-tinygrid-noisy.test
Normal file
22
reinforcement/test_cases/q4/2-tinygrid-noisy.test
Normal file
@ -0,0 +1,22 @@
|
||||
class: "EpsilonGreedyTest"
|
||||
|
||||
# GridWorld specification
|
||||
# _ is empty space
|
||||
# numbers are terminal states with that value
|
||||
# # is a wall
|
||||
# S is a start state
|
||||
#
|
||||
grid: """
|
||||
-10
|
||||
S
|
||||
10
|
||||
"""
|
||||
discount: "0.75"
|
||||
noise: "0.25"
|
||||
livingReward: "0.0"
|
||||
epsilon: "0.5"
|
||||
learningRate: "0.1"
|
||||
numExperiences: "100"
|
||||
valueIterations: "100"
|
||||
iterations: "10000"
|
||||
|
2
reinforcement/test_cases/q4/3-bridge.solution
Normal file
2
reinforcement/test_cases/q4/3-bridge.solution
Normal file
@ -0,0 +1,2 @@
|
||||
# This is the solution file for test_cases/q4/3-bridge.test.
|
||||
# File intentionally blank.
|
27
reinforcement/test_cases/q4/3-bridge.test
Normal file
27
reinforcement/test_cases/q4/3-bridge.test
Normal file
@ -0,0 +1,27 @@
|
||||
class: "EpsilonGreedyTest"
|
||||
|
||||
# GridWorld specification
|
||||
# _ is empty space
|
||||
# numbers are terminal states with that value
|
||||
# # is a wall
|
||||
# S is a start state
|
||||
#
|
||||
grid: """
|
||||
# 10 #
|
||||
-100 _ -100
|
||||
-100 _ -100
|
||||
-100 _ -100
|
||||
-100 _ -100
|
||||
-100 S -100
|
||||
# 1 #
|
||||
"""
|
||||
gridName: "bridgeGrid"
|
||||
discount: "0.85"
|
||||
noise: "0.1"
|
||||
livingReward: "0.0"
|
||||
epsilon: "0.5"
|
||||
learningRate: "0.1"
|
||||
numExperiences: "500"
|
||||
valueIterations: "100"
|
||||
iterations: "10000"
|
||||
|
2
reinforcement/test_cases/q4/4-discountgrid.solution
Normal file
2
reinforcement/test_cases/q4/4-discountgrid.solution
Normal file
@ -0,0 +1,2 @@
|
||||
# This is the solution file for test_cases/q4/4-discountgrid.test.
|
||||
# File intentionally blank.
|
24
reinforcement/test_cases/q4/4-discountgrid.test
Normal file
24
reinforcement/test_cases/q4/4-discountgrid.test
Normal file
@ -0,0 +1,24 @@
|
||||
class: "EpsilonGreedyTest"
|
||||
|
||||
# GridWorld specification
|
||||
# _ is empty space
|
||||
# numbers are terminal states with that value
|
||||
# # is a wall
|
||||
# S is a start state
|
||||
#
|
||||
grid: """
|
||||
-10 _ 10 _ _
|
||||
-10 _ # _ _
|
||||
-10 _ 1 _ _
|
||||
-10 _ # # _
|
||||
-10 S _ _ _
|
||||
"""
|
||||
discount: "0.9"
|
||||
noise: "0.2"
|
||||
livingReward: "0.0"
|
||||
epsilon: "0.2"
|
||||
learningRate: "0.1"
|
||||
numExperiences: "3000"
|
||||
valueIterations: "100"
|
||||
iterations: "10000"
|
||||
|
2
reinforcement/test_cases/q4/CONFIG
Normal file
2
reinforcement/test_cases/q4/CONFIG
Normal file
@ -0,0 +1,2 @@
|
||||
max_points: "2"
|
||||
class: "PassAllTestsQuestion"
|
Reference in New Issue
Block a user