ml q3

2024-07-05 19:21:02 +08:00
parent 422beb4a9b
commit 99f53727ba
2 changed files with 57 additions and 1 deletions
--- a/machinelearning/backend.py
+++ b/machinelearning/backend.py
@@ -265,7 +265,12 @@ class DigitClassificationDataset(CustomDataset):
    def get_validation_accuracy(self):
        dev_logits = self.model.run(torch.tensor(self.dev_images, dtype=torch.float32)).data
        dev_predicted = torch.argmax(dev_logits, axis=1).detach()
-        dev_accuracy = (dev_predicted == self.dev_labels).mean()
+        # The model may keep its tensors on the GPU, so bring the predictions
+        # back to the CPU before comparing them with the dev labels.
+        dev_labels = torch.as_tensor(self.dev_labels)
+        is_correct = torch.eq(dev_predicted.cpu(), dev_labels)
+        # Mean of the 0/1 matches is the fraction correct (a 0-dim float tensor).
+        dev_accuracy = is_correct.float().mean()
        return dev_accuracy

 class LanguageIDDataset(CustomDataset):
--- a/machinelearning/models.py
+++ b/machinelearning/models.py
@@ -225,8 +225,36 @@ class DigitClassificationModel(Module):
        input_size = 28 * 28
        output_size = 10
        "*** YOUR CODE HERE ***"
+        hidden_layer1_size=300
+        hidden_layer2_size=300
+        hidden_layer3_size=300
+        self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+        self.fc1 = Linear(input_size, hidden_layer1_size).to(self.device)
+        self.fc2 = Linear(hidden_layer1_size, hidden_layer2_size).to(self.device)
+        self.fc3 = Linear(hidden_layer2_size, hidden_layer3_size).to(self.device)
+        self.fc_out = Linear(hidden_layer3_size, output_size,bias=False).to(self.device)


+    def forward(self, x):
+        """
+        Compute class scores (logits) for a batch of flattened digit images.
+
+        The batch is moved to the model's device, passed through the three
+        ReLU-activated hidden layers in order, and then projected by the
+        final linear layer; no activation is applied to the output, so a
+        higher score means the class is considered more likely.
+
+        Inputs:
+            x: a tensor with shape (batch_size x 784)
+        Output:
+            A tensor with shape (batch_size x 10) containing predicted scores
+                (also called logits)
+        """
+        activations = x.to(self.device)
+        # Each hidden layer is a linear map followed by a ReLU non-linearity.
+        for hidden_layer in (self.fc1, self.fc2, self.fc3):
+            activations = relu(hidden_layer(activations))
+        return self.fc_out(activations)

    def run(self, x):
        """
@@ -243,6 +271,7 @@ class DigitClassificationModel(Module):
                (also called logits)
        """
        """ YOUR CODE HERE """
+        return self.forward(x)


    def get_loss(self, x, y):
@@ -259,6 +288,7 @@ class DigitClassificationModel(Module):
        Returns: a loss tensor
        """
        """ YOUR CODE HERE """
+        return cross_entropy(self.forward(x.to(self.device)), y.to(self.device))

        

@@ -267,6 +297,27 @@ class DigitClassificationModel(Module):
        Trains the model.
        """
        """ YOUR CODE HERE """
+        # Mini-batch Adam; stop after max_round steps or once dev accuracy > required_accuracy.
+        optimizer = torch.optim.Adam(self.parameters(), lr=0.0005)
+        dataloader = DataLoader(dataset, batch_size=20, shuffle=True)
+        max_round = 15000  # hard cap on the number of optimizer steps
+        required_accuracy = 0.99  # early-stop threshold on dev accuracy
+        eval_interval = 100  # a full dev-set pass on every batch would dominate run time
+        round_cnt = 0
+        accuracy = dataset.get_validation_accuracy()
+        while round_cnt < max_round and accuracy <= required_accuracy:
+            for sample in dataloader:
+                loss = self.get_loss(sample['x'], sample['label'])  # get_loss moves the batch to self.device
+                optimizer.zero_grad()
+                loss.backward()
+                optimizer.step()
+                round_cnt += 1
+                if round_cnt % eval_interval == 0:
+                    accuracy = dataset.get_validation_accuracy()
+                    print(f"round: {round_cnt}, accuracy: {accuracy}")
+                if round_cnt >= max_round or accuracy > required_accuracy:  # per step, not per epoch
+                    break
+        print(f"round: {round_cnt}, accuracy: {dataset.get_validation_accuracy()}")