Files
PPCA-AIPacMan-2024/reinforcement/test_cases/q6/5-coord-extractor.test
2024-07-06 01:30:00 +08:00

26 lines
503 B
Plaintext

# Test-case definition: selects the ApproximateQLearningTest test class and
# runs it on the grid below with the CoordinateExtractor feature extractor.
# NOTE(review): every value here is a quoted string; presumably the test
# class converts the numeric ones itself -- confirm against the harness.
class: "ApproximateQLearningTest"
# GridWorld specification. Cells are separated by single spaces.
#   _        empty space
#   number   terminal state with that value
#   #        wall
#   S        start state
#
# The layout is 5 rows by 5 columns: the entire left column is made of -10
# terminal states, the top row holds a 10 terminal, the middle row holds a
# 1 terminal, and S sits in the bottom row right next to the left column.
# Do not put comments between the triple quotes: there, # is a wall cell.
grid: """
-10 _ 10 _ _
-10 _ # _ _
-10 _ 1 _ _
-10 _ # # _
-10 S _ _ _
"""
# NOTE(review): the meanings below are inferred from the key names only;
# the code that reads them is not visible in this file -- verify there.
# Presumably environment settings: discount factor, probability of an
# unintended move, and the reward received on each non-terminal step.
discount: "0.9"
noise: "0.2"
livingReward: "0.0"
# Presumably learner settings: exploration rate and step size.
epsilon: "0.2"
learningRate: "0.1"
# Presumably run lengths/counts used by the test class -- TODO confirm which
# phase of the test each one controls.
numExperiences: "3000"
valueIterations: "100"
iterations: "10000"
# Name of the feature extractor used by this test case.
extractor: "CoordinateExtractor"