enter reinforcement

This commit is contained in:
2024-07-06 01:30:00 +08:00
parent f105ba0150
commit e3f8181056
116 changed files with 19698 additions and 0 deletions

View File

@ -0,0 +1,2 @@
# This is the solution file for test_cases/q2/1-question-2.1.test.
# File intentionally blank.

View File

@ -0,0 +1,31 @@
class: "GridPolicyTest"
# Name of the function in the analysis module that returns (discount, noise)
parameterFn: "question2a"
# GridWorld specification
# _ is empty space
# numbers are terminal states with that value
# # is a wall
# S is a start state
#
grid: """
_ _ _ _ _
_ # _ _ _
_ # 1 # 10
S _ _ _ _
-10 -10 -10 -10 -10
"""
gridName: "discountGrid"
# Policy specification
# _ policy choice not checked
# N, E, S, W policy action must be north, east, south, west
#
policy: """
_ _ _ _ _
_ _ _ _ _
_ _ _ _ _
E E N _ _
_ _ _ _ _
"""

View File

@ -0,0 +1,2 @@
# This is the solution file for test_cases/q2/2-question-2.2.test.
# File intentionally blank.

View File

@ -0,0 +1,31 @@
class: "GridPolicyTest"
# Name of the function in the analysis module that returns (discount, noise)
parameterFn: "question2b"
# GridWorld specification
# _ is empty space
# numbers are terminal states with that value
# # is a wall
# S is a start state
#
grid: """
_ _ _ _ _
_ # _ _ _
_ # 1 # 10
S _ _ _ _
-10 -10 -10 -10 -10
"""
gridName: "discountGrid"
# Policy specification
# _ policy choice not checked
# N, E, S, W policy action must be north, east, south, west
#
policy: """
E E S _ _
N _ S _ _
N _ _ _ _
N _ _ _ _
_ _ _ _ _
"""

View File

@ -0,0 +1,2 @@
# This is the solution file for test_cases/q2/3-question-2.3.test.
# File intentionally blank.

View File

@ -0,0 +1,31 @@
class: "GridPolicyTest"
# Name of the function in the analysis module that returns (discount, noise)
parameterFn: "question2c"
# GridWorld specification
# _ is empty space
# numbers are terminal states with that value
# # is a wall
# S is a start state
#
grid: """
_ _ _ _ _
_ # _ _ _
_ # 1 # 10
S _ _ _ _
-10 -10 -10 -10 -10
"""
gridName: "discountGrid"
# Policy specification
# _ policy choice not checked
# N, E, S, W policy action must be north, east, south, west
#
policy: """
_ _ _ _ _
_ _ _ _ _
_ _ _ _ _
E E E E N
_ _ _ _ _
"""

View File

@ -0,0 +1,2 @@
# This is the solution file for test_cases/q2/4-question-2.4.test.
# File intentionally blank.

View File

@ -0,0 +1,36 @@
class: "GridPolicyTest"
# Name of the function in the analysis module that returns (discount, noise)
parameterFn: "question2d"
# GridWorld specification
# _ is empty space
# numbers are terminal states with that value
# # is a wall
# S is a start state
#
grid: """
_ _ _ _ _
_ # _ _ _
_ # 1 # 10
S _ _ _ _
-10 -10 -10 -10 -10
"""
gridName: "discountGrid"
# Policy specification
# _ policy choice not checked
# N, E, S, W policy action must be north, east, south, west
#
policy: """
_ _ _ _ _
_ _ _ _ _
_ _ _ _ _
N _ _ _ _
_ _ _ _ _
"""
# A state that the most probable path must visit
# (x,y) for a particular location; (0,0) is bottom left
# TERMINAL_STATE for the terminal state
pathVisits: "(4,2)"

View File

@ -0,0 +1,2 @@
# This is the solution file for test_cases/q2/5-question-2.5.test.
# File intentionally blank.

View File

@ -0,0 +1,36 @@
class: "GridPolicyTest"
# Name of the function in the analysis module that returns (discount, noise)
parameterFn: "question2e"
# GridWorld specification
# _ is empty space
# numbers are terminal states with that value
# # is a wall
# S is a start state
#
grid: """
_ _ _ _ _
_ # _ _ _
_ # 1 # 10
S _ _ _ _
-10 -10 -10 -10 -10
"""
gridName: "discountGrid"
# Policy specification
# _ policy choice not checked
# N, E, S, W policy action must be north, east, south, west
#
policy: """
_ _ _ _ _
_ _ _ _ _
_ _ _ _ _
_ _ _ _ _
_ _ _ _ _
"""
# A state that the most probable path must not visit
# (x,y) for a particular location; (0,0) is bottom left
# TERMINAL_STATE for the terminal state
pathNotVisits: "TERMINAL_STATE"

View File

@ -0,0 +1,2 @@
max_points: "5"
class: "NumberPassedQuestion"