enter reinforcement

2024-07-06 01:30:00 +08:00
parent f105ba0150
commit e3f8181056
116 changed files with 19698 additions and 0 deletions
--- a/reinforcement/test_cases/q2/1-question-2.1.solution
+++ b/reinforcement/test_cases/q2/1-question-2.1.solution
@@ -0,0 +1,2 @@
+# This is the solution file for test_cases/q2/1-question-2.1.test.
+# File intentionally blank.
--- a/reinforcement/test_cases/q2/1-question-2.1.test
+++ b/reinforcement/test_cases/q2/1-question-2.1.test
@@ -0,0 +1,31 @@
+class: "GridPolicyTest"
+
+# Name of the function in the analysis module that returns (discount, noise)
+parameterFn: "question2a"
+
+# GridWorld specification
+#    _ is empty space
+#    numbers are terminal states with that value
+#    # is a wall
+#    S is a start state
+#
+grid: """
+   _    _    _    _    _  
+   _    #    _    _    _
+   _    #    1    #   10
+   S    _    _    _    _
+ -10  -10  -10  -10  -10
+"""
+gridName: "discountGrid"
+
+# Policy specification
+#    _ 			policy choice not checked
+#    N, E, S, W policy action must be north, east, south, west
+#
+policy: """
+   _    _    _    _    _  
+   _    _    _    _    _  
+   _    _    _    _    _  
+   E    E    N    _    _  
+   _    _    _    _    _  
+"""
--- a/reinforcement/test_cases/q2/2-question-2.2.solution
+++ b/reinforcement/test_cases/q2/2-question-2.2.solution
@@ -0,0 +1,2 @@
+# This is the solution file for test_cases/q2/2-question-2.2.test.
+# File intentionally blank.
--- a/reinforcement/test_cases/q2/2-question-2.2.test
+++ b/reinforcement/test_cases/q2/2-question-2.2.test
@@ -0,0 +1,31 @@
+class: "GridPolicyTest"
+
+# Name of the function in the analysis module that returns (discount, noise)
+parameterFn: "question2b"
+
+# GridWorld specification
+#    _ is empty space
+#    numbers are terminal states with that value
+#    # is a wall
+#    S is a start state
+#
+grid: """
+   _    _    _    _    _  
+   _    #    _    _    _
+   _    #    1    #   10
+   S    _    _    _    _
+ -10  -10  -10  -10  -10
+"""
+gridName: "discountGrid"
+
+# Policy specification
+#    _ 			policy choice not checked
+#    N, E, S, W policy action must be north, east, south, west
+#
+policy: """
+   E    E    S    _    _  
+   N    _    S    _    _  
+   N    _    _    _    _  
+   N    _    _    _    _  
+   _    _    _    _    _  
+"""
--- a/reinforcement/test_cases/q2/3-question-2.3.solution
+++ b/reinforcement/test_cases/q2/3-question-2.3.solution
@@ -0,0 +1,2 @@
+# This is the solution file for test_cases/q2/3-question-2.3.test.
+# File intentionally blank.
--- a/reinforcement/test_cases/q2/3-question-2.3.test
+++ b/reinforcement/test_cases/q2/3-question-2.3.test
@@ -0,0 +1,31 @@
+class: "GridPolicyTest"
+
+# Name of the function in the analysis module that returns (discount, noise)
+parameterFn: "question2c"
+
+# GridWorld specification
+#    _ is empty space
+#    numbers are terminal states with that value
+#    # is a wall
+#    S is a start state
+#
+grid: """
+   _    _    _    _    _  
+   _    #    _    _    _
+   _    #    1    #   10
+   S    _    _    _    _
+ -10  -10  -10  -10  -10
+"""
+gridName: "discountGrid"
+
+# Policy specification
+#    _ 			policy choice not checked
+#    N, E, S, W policy action must be north, east, south, west
+#
+policy: """
+   _    _    _    _    _  
+   _    _    _    _    _  
+   _    _    _    _    _  
+   E    E    E    E    N  
+   _    _    _    _    _  
+"""
--- a/reinforcement/test_cases/q2/4-question-2.4.solution
+++ b/reinforcement/test_cases/q2/4-question-2.4.solution
@@ -0,0 +1,2 @@
+# This is the solution file for test_cases/q2/4-question-2.4.test.
+# File intentionally blank.
--- a/reinforcement/test_cases/q2/4-question-2.4.test
+++ b/reinforcement/test_cases/q2/4-question-2.4.test
@@ -0,0 +1,36 @@
+class: "GridPolicyTest"
+
+# Name of the function in the analysis module that returns (discount, noise)
+parameterFn: "question2d"
+
+# GridWorld specification
+#    _ is empty space
+#    numbers are terminal states with that value
+#    # is a wall
+#    S is a start state
+#
+grid: """
+   _    _    _    _    _  
+   _    #    _    _    _
+   _    #    1    #   10
+   S    _    _    _    _
+ -10  -10  -10  -10  -10
+"""
+gridName: "discountGrid"
+
+# Policy specification
+#    _ 			policy choice not checked
+#    N, E, S, W policy action must be north, east, south, west
+#
+policy: """
+   _    _    _    _    _  
+   _    _    _    _    _  
+   _    _    _    _    _  
+   N    _    _    _    _  
+   _    _    _    _    _  
+"""
+
+# State that the most probable path must visit
+#    (x,y) for a particular location; (0,0) is bottom left
+#    TERMINAL_STATE for the terminal state
+pathVisits: "(4,2)"
--- a/reinforcement/test_cases/q2/5-question-2.5.solution
+++ b/reinforcement/test_cases/q2/5-question-2.5.solution
@@ -0,0 +1,2 @@
+# This is the solution file for test_cases/q2/5-question-2.5.test.
+# File intentionally blank.
--- a/reinforcement/test_cases/q2/5-question-2.5.test
+++ b/reinforcement/test_cases/q2/5-question-2.5.test
@@ -0,0 +1,36 @@
+class: "GridPolicyTest"
+
+# Name of the function in the analysis module that returns (discount, noise)
+parameterFn: "question2e"
+
+# GridWorld specification
+#    _ is empty space
+#    numbers are terminal states with that value
+#    # is a wall
+#    S is a start state
+#
+grid: """
+   _    _    _    _    _  
+   _    #    _    _    _
+   _    #    1    #   10
+   S    _    _    _    _
+ -10  -10  -10  -10  -10
+"""
+gridName: "discountGrid"
+
+# Policy specification
+#    _ 			policy choice not checked
+#    N, E, S, W policy action must be north, east, south, west
+#
+policy: """
+   _    _    _    _    _  
+   _    _    _    _    _  
+   _    _    _    _    _  
+   _    _    _    _    _
+   _    _    _    _    _  
+"""
+
+# State that the most probable path must not visit
+#    (x,y) for a particular location; (0,0) is bottom left
+#    TERMINAL_STATE for the terminal state
+pathNotVisits: "TERMINAL_STATE"
--- a/reinforcement/test_cases/q2/CONFIG
+++ b/reinforcement/test_cases/q2/CONFIG
@@ -0,0 +1,2 @@
+max_points: "5"
+class: "NumberPassedQuestion"