Add model.conv1.weight normal after update grad.

2024-10-28 16:31:42 +08:00 · 2024-10-28 16:31:42 +08:00 · 5b2cd4da61
parent 6a0b47c674
commit 5b2cd4da61
2 changed files with 17 additions and 9 deletions
--- a/unsuper/.gitignore
+++ b/unsuper/.gitignore
@ -1,2 +1,4 @@
 dump1
 dump2
 *.png
 *.log
--- a/unsuper/minist.py
+++ b/unsuper/minist.py
@ -5,15 +5,23 @@ import torch.nn as nn
 import torch.nn.functional as F  # Add this line
 import torchvision
 import torchvision.transforms as transforms
 import numpy as np
 import random
 sys.path.append("..")
 from tools import show
-seed = 4321
+seed = 42
 torch.manual_seed(seed)
 if torch.cuda.is_available():
    torch.cuda.manual_seed(seed)
    torch.cuda.manual_seed_all(seed)
 np.random.seed(seed)
 random.seed(seed)
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 # device = torch.device("cpu")
 # device = torch.device("mps")
 num_epochs = 1
@ -60,15 +68,12 @@ class ConvNet(nn.Module):
    def printFector(self, x, label, dir=""):
        show.DumpTensorToImage(x.view(-1, x.shape[2], x.shape[3]), dir + "/input_image.png", Contrast=[0, 1.0])
        # show.DumpTensorToLog(x, "input_image.log")
        w = self.normal_conv1_weight()
        x = torch.conv2d(x, w)
        show.DumpTensorToImage(w.view(-1, w.shape[2], w.shape[3]), dir + "/conv1_weight.png")
        # show.DumpTensorToLog(w, "conv1_weight.log")
        show.DumpTensorToImage(x.view(-1, x.shape[2], x.shape[3]), dir + "/conv1_output.png")
        # show.DumpTensorToLog(x, "conv1_output.png")
        x = self.pool(x)
        x = self.conv2(x)
@ -132,16 +137,17 @@ for epoch in range(epochs):
        model.conv1.weight.grad = None
        loss.backward()
-        model.conv1.weight.data = model.conv1.weight.data - model.conv1.weight.grad * 10000
+        model.conv1.weight.data = model.conv1.weight.data - model.conv1.weight.grad * 1000
        model.conv1.weight.data = model.normal_conv1_weight()
        if (i + 1) % 100 == 0:
            print(f"Epoch [{epoch+1}/{epochs}], Step [{i+1}/{n_total_steps}], Loss: {loss.item():.8f}")
 show.DumpTensorToImage(images.view(-1, images.shape[2], images.shape[3]), "input_image.png", Contrast=[0, 1.0])
 g = model.conv1.weight.grad
-show.DumpTensorToImage(g.view(-1, g.shape[2], g.shape[3]).cpu(), "conv1_weight_grad.png")
+show.DumpTensorToImage(g.view(-1, g.shape[2], g.shape[3]).cpu(), "conv1_weight_grad.png", Value2Log=True)
 w = model.conv1.weight.data
-show.DumpTensorToImage(w.view(-1, w.shape[2], w.shape[3]), "conv1_weight_update.png")
+show.DumpTensorToImage(w.view(-1, w.shape[2], w.shape[3]), "conv1_weight_update.png", Value2Log=True)
 # model.conv1.weight.data = torch.rand(model.conv1.weight.data.shape, device=device)