Wait for further optimization

2024-07-22 01:33:54 +08:00
parent 25f46c9a13
commit 1f217770b7
2 changed files with 4 additions and 1 deletion
--- a/reinforcement/deepQLearningAgents.py
+++ b/reinforcement/deepQLearningAgents.py
@@ -73,6 +73,9 @@ class PacmanDeepQAgent(PacmanQAgent):
        else:
            print("Initializing new model parameters")
    def save_model(self, filename="para.bin"):
        if model.kProductionMode:
            print("in production mode, not saving model")
            return
        print(f"Saving model parameters to {filename}")
        torch.save({
            'model_state_dict': self.model.state_dict(),
--- a/reinforcement/model.py
+++ b/reinforcement/model.py
@@ -11,7 +11,7 @@ from torch import tensor, double, optim
 from torch.nn.functional import relu, mse_loss
 import torch
-kProductionMode=True
+kProductionMode=False
 class DeepQNetwork(Module):
    """
    A model that uses a Deep Q-value Network (DQN) to approximate Q(s,a) as part