Add UnsuperLearnTrainWeight to train new weight kernel

2019-09-02 19:28:04 +08:00 · 2019-09-02 19:28:04 +08:00 · 6201163e14
parent d4a22775d4
commit 6201163e14
10 changed files with 127 additions and 209 deletions
--- a/FilterEvaluator/Evaluator.py
+++ b/FilterEvaluator/Evaluator.py
@ -53,32 +53,8 @@ model = utils.LoadModel(model, CurrentPath+"/checkpoint.pkl")
 # traindata, testdata = Loader.RandomMnist(batchsize, style="VerticalOneLine")
 # traindata, testdata = Loader.RandomMnist(batchsize, style="VerticalZebra")
 # traindata, testdata = Loader.Cifar10Mono(batchsize)
-traindata, testdata = Loader.Cifar10Mono(batchsize, num_workers=0, shuffle=True)
+traindata, testdata = Loader.Cifar10Mono(batchsize, num_workers=2, shuffle=True)

-def ConvKernelToImage(model, layer, foldname):
-    if not os.path.exists(foldname):
-        os.mkdir(foldname)
-    a2 = model.features[layer].weight.data
-    a2 = a2.cpu().detach().numpy().reshape((-1, a2.shape[-2], a2.shape[-1]))
-    for i in range(a2.shape[0]):
-        d = a2[i]
-        dmin = np.min(d)
-        dmax = np.max(d)
-        d = (d - dmin)*255.0/(dmax-dmin)
-        d = d.astype(int)
-        cv2.imwrite(foldname+"/"+str(i)+".png", d)
-
-def ConvKernelToImage(numpydate, foldname):
-    if not os.path.exists(foldname):
-        os.mkdir(foldname)
-    a2 = numpydate.reshape((-1, numpydate.shape[-2], numpydate.shape[-1]))
-    for i in range(a2.shape[0]):
-        d = a2[i]
-        dmin = np.min(d)
-        dmax = np.max(d)
-        d = (d - dmin)*255.0/(dmax-dmin)
-        d = d.astype(int)
-        cv2.imwrite(foldname+"/"+str(i)+".png", d)


 def GetScore(netmodel,layer,SearchLayer,DataSet,Interation=-1):
@ -175,7 +151,7 @@ def TrainLayer(netmodel, layer, SearchLayer, DataSet, Epoch=100):
        print("  epoch :" + str(e))
    return SearchLayer.weight.data.cpu().detach().numpy()

-def UnsuperLearnTrainWeight(model, layer, dataloader, NumTrain=500, TrainChannelRatio=1, Epoch=100):
+def UnsuperLearnTrainWeight(model, layer, dataloader, NumTrain=500, TrainChannelRatio=1, Epoch=20):
    tl = model.features[layer]
    newlayer = nn.Conv2d(tl.in_channels, tl.out_channels * TrainChannelRatio, tl.kernel_size,
                         tl.stride, tl.padding, tl.dilation, tl.groups, tl.bias, tl.padding_mode)
@ -203,6 +179,6 @@ np.save("WeightTrain.npy", weight)



-ConvKernelToImage(weight, CurrentPath+"image")
+utils.NumpyToImage(weight, CurrentPath+"image")
 # utils.SaveModel(model,CurrentPath+"/checkpoint.pkl")
 print("save model sucess")
--- a/FilterEvaluator/EvaluatorEntropy.py
+++ b/FilterEvaluator/EvaluatorEntropy.py
@ -47,16 +47,24 @@ model = utils.LoadModel(model, CurrentPath+"/checkpoint.pkl")



+
 # traindata, testdata = Loader.MNIST(batchsize)
 # traindata, testdata = Loader.RandomMnist(batchsize, style="Vertical")
 # traindata, testdata = Loader.RandomMnist(batchsize, style="Horizontal")
 # traindata, testdata = Loader.RandomMnist(batchsize, style="VerticalOneLine")
 # traindata, testdata = Loader.RandomMnist(batchsize, style="VerticalZebra")
 # traindata, testdata = Loader.Cifar10Mono(batchsize)
-traindata, testdata = Loader.Cifar10Mono(batchsize, num_workers=0, shuffle=True)
+traindata, testdata = Loader.Cifar10Mono(batchsize, num_workers=2, shuffle=True)


-def GetSample(netmodel,layer,SearchLayer,DataSet,Interation=-1):
+
+
+
+
+
+
+
+def GetScore(netmodel,layer,SearchLayer,DataSet,Interation=-1):
    netmodel.eval()
    sample = utils.SetDevice(torch.empty((SearchLayer.out_channels,0)))

@ -92,21 +100,7 @@ def GetSample(netmodel,layer,SearchLayer,DataSet,Interation=-1):
    dat2 = torch.mean(dat2 * dat2,dim=1)
    return dat2.cpu().detach().numpy()

-def ConvKernelToImage(model, layer, foldname):
-    if not os.path.exists(foldname):
-        os.mkdir(foldname)
-    a2 = model.features[layer].weight.data
-    a2 = a2.cpu().detach().numpy().reshape((-1, a2.shape[-2], a2.shape[-1]))
-    for i in range(a2.shape[0]):
-        d = a2[i]
-        dmin = np.min(d)
-        dmax = np.max(d)
-        d = (d - dmin)*255.0/(dmax-dmin)
-        d = d.astype(int)
-        cv2.imwrite(foldname+"/"+str(i)+".png", d)
-
-
-def UnsuperLearnConvWeight(model, layer, dataloader, NumSearch=10000, SaveChannelRatio=500, SearchChannelRatio=1, Interation=10):
+def UnsuperLearnSearchWeight(model, layer, dataloader, NumSearch=10000, SaveChannelRatio=500, SearchChannelRatio=1, Interation=10):
    tl = model.features[layer]
    newlayer = nn.Conv2d(tl.in_channels, tl.out_channels * SearchChannelRatio, tl.kernel_size,
                         tl.stride, tl.padding, tl.dilation, tl.groups, tl.bias, tl.padding_mode)
@ -122,7 +116,7 @@ def UnsuperLearnConvWeight(model, layer, dataloader, NumSearch=10000, SaveChanne
        newweight = np.random.uniform(-1.0,1.0,newweightshape).astype("float32")
        newlayer.weight.data=utils.SetDevice(torch.from_numpy(newweight))

-        score = GetSample(model, layer, newlayer, dataloader, Interation)
+        score = GetScore(model, layer, newlayer, dataloader, Interation)

        minactive = np.append(minactive, score)
        minweight = np.concatenate((minweight, newweight))
@ -139,16 +133,77 @@ def UnsuperLearnConvWeight(model, layer, dataloader, NumSearch=10000, SaveChanne
    return minweight


-weight = UnsuperLearnConvWeight(model, layer, traindata, NumSearch=100000, SearchChannelRatio=8, Interation=10)
-np.save("weight.npy", weight)
+def TrainLayer(netmodel, layer, SearchLayer, DataSet, Epoch=100):
+    netmodel.eval()
+    sample = utils.SetDevice(torch.empty((SearchLayer.out_channels,0)))
+    layer = layer-1
+    SearchLayer.weight.data.requires_grad=True
+    optimizer = optim.SGD(SearchLayer.parameters(), lr=0.1)
+    for e in range(Epoch):
+        for batch_idx, (data, target) in enumerate(DataSet):
+            optimizer.zero_grad()
+            data = utils.SetDevice(data)
+            target = utils.SetDevice(target)
+            output = netmodel.ForwardLayer(data,layer)
+            output = SearchLayer(output)
+            sample = torch.reshape(output.transpose(0,1),(SearchLayer.out_channels,-1))
+            sample_mean=torch.mean(sample,dim=1,keepdim=True)
+            dat1 = torch.mean(torch.abs(sample - sample_mean),dim=1,keepdim=True)
+            dat2 = (sample - sample_mean)/dat1
+            dat2 = torch.mean(dat2 * dat2,dim=1)
+            label = dat2*0.5
+            loss = F.l1_loss(dat2, label)
+            loss.backward()
+            optimizer.step()
+        print("  epoch :" + str(e))
+    return SearchLayer.weight.data.cpu().detach().numpy()

-ConvKernelToImage(model, layer, CurrentPath+"image")
-utils.SaveModel(model,CurrentPath+"/checkpoint.pkl")
+def UnsuperLearnTrainWeight(model, layer, dataloader, NumTrain=500, TrainChannelRatio=1, Epoch=20):
+    tl = model.features[layer]
+    newlayer = nn.Conv2d(tl.in_channels, tl.out_channels * TrainChannelRatio, tl.kernel_size,
+                         tl.stride, tl.padding, tl.dilation, tl.groups, tl.bias, tl.padding_mode)
+    newlayer = utils.SetDevice(newlayer)
+    newweightshape = list(newlayer.weight.data.shape)
+    minactive = np.empty((0))
+    minweight = np.empty([0,newweightshape[1],newweightshape[2],newweightshape[3]])
+    for i in range(NumTrain):
+        newweight = np.random.uniform(-1.0,1.0,newweightshape).astype("float32")
+        newlayer.weight.data=utils.SetDevice(torch.from_numpy(newweight))
+        newweight = TrainLayer(model, layer, newlayer, dataloader, Epoch)
+        minweight = np.concatenate((minweight, newweight))
+        print("search :" + str(i))
+    return minweight
+
+
+
+
+
+
+
+
+weight = np.load(CurrentPath+"WeightSearch.npy")
+# weight = np.zeros((990,3,3));
+# weight[:,1]=100
+# weight[:,:,1]=100
+utils.NumpyToImage(weight,CurrentPath+"image")
+
+a=0
+
+
+
+
+
+
+
+
+# weight = UnsuperLearnSearchWeight(model, layer, traindata, NumSearch=100000, SearchChannelRatio=8, Interation=10)
+# np.save("WeightSearch.npy", weight)
+
+weight = UnsuperLearnTrainWeight(model, layer, traindata)
+np.save("WeightTrain.npy", weight)
+
+
+
+ConvKernelToImage(weight, CurrentPath+"image")
+# utils.SaveModel(model,CurrentPath+"/checkpoint.pkl")
 print("save model sucess")
-
-
-
-
-
-
-weight =  np.load("weight.npy")
--- a/FilterEvaluator/EvaluatorGrad.py
+++ b/FilterEvaluator/EvaluatorGrad.py
@ -1,153 +0,0 @@
-from __future__ import print_function
-import os
-import sys
-
-import torch
-import torch.nn as nn
-import torch.nn.functional as F
-import torch.optim as optim
-import torchvision
-from torchvision import datasets, transforms
-import torchvision.models as models
-import matplotlib.pyplot as plt
-import numpy as np
-from torch.utils.data import Dataset, DataLoader
-from PIL import Image
-import random
-import cv2
-
-
-CurrentPath = os.path.split(os.path.realpath(__file__))[0]+"/"
-print("Current Path :" + CurrentPath)
-
-sys.path.append(CurrentPath+'../tools')
-sys.path.append(CurrentPath+'../')
-
-import Model as Model
-from tools import utils, Train, Loader
-
-batchsize = 128
-
-
-# model = utils.SetDevice(Model.Net5Grad35())
-# model = utils.SetDevice(Model.Net31535())
-model = utils.SetDevice(Model.Net3Grad335())
-# model = utils.SetDevice(Model.Net3())
-
-
-layers = model.PrintLayer()
-layer = 0
-
-model = utils.LoadModel(model, CurrentPath+"/checkpoint.pkl")
-
-
-
-
-
-# traindata, testdata = Loader.MNIST(batchsize)
-# traindata, testdata = Loader.RandomMnist(batchsize, style="Vertical")
-# traindata, testdata = Loader.RandomMnist(batchsize, style="Horizontal")
-# traindata, testdata = Loader.RandomMnist(batchsize, style="VerticalOneLine")
-# traindata, testdata = Loader.RandomMnist(batchsize, style="VerticalZebra")
-# traindata, testdata = Loader.Cifar10Mono(batchsize)
-traindata, testdata = Loader.Cifar10Mono(batchsize, num_workers=0, shuffle=True)
-
-
-
-
-
-
-
-
-
-
-# k = np.ones((3,3)).astype("float32")*1.0
-# d = np.ones((3,3)).astype("float32")*3.0
-# l = np.ones((3,3)).astype("float32")*3.5
-
-# k = torch.from_numpy(k)
-# d = torch.from_numpy(d)
-# l = torch.from_numpy(l)
-
-# k.requires_grad=True
-
-# optimizer = optim.SGD([k], lr=0.1)
-# optimizer.zero_grad()
-
-
-# output = k + d
-
-# loss = F.l1_loss(output, l)
-# loss.backward()
-# optimizer.step()
-
-
-
-def ConvKernelToImage(numpydate, foldname):
-    if not os.path.exists(foldname):
-        os.mkdir(foldname)
-    a2 = numpydate.reshape((-1, numpydate.shape[-2], numpydate.shape[-1]))
-    for i in range(a2.shape[0]):
-        d = a2[i]
-        dmin = np.min(d)
-        dmax = np.max(d)
-        d = (d - dmin)*255.0/(dmax-dmin)
-        d = d.astype(int)
-        cv2.imwrite(foldname+"/"+str(i)+".png", d)
-
-
-
-def TrainLayer(netmodel, layer, SearchLayer, DataSet, Epoch=100):
-    netmodel.eval()
-    sample = utils.SetDevice(torch.empty((SearchLayer.out_channels,0)))
-    layer = layer-1
-    SearchLayer.weight.data.requires_grad=True
-    optimizer = optim.SGD(SearchLayer.parameters(), lr=0.1)
-    for e in range(Epoch):
-        for batch_idx, (data, target) in enumerate(DataSet):
-            optimizer.zero_grad()
-            data = utils.SetDevice(data)
-            target = utils.SetDevice(target)
-            output = netmodel.ForwardLayer(data,layer)
-            output = SearchLayer(output)
-            sample = torch.reshape(output.transpose(0,1),(SearchLayer.out_channels,-1))
-            sample_mean=torch.mean(sample,dim=1,keepdim=True)
-            dat1 = torch.mean(torch.abs(sample - sample_mean),dim=1,keepdim=True)
-            dat2 = (sample - sample_mean)/dat1
-            dat2 = torch.mean(dat2 * dat2,dim=1)
-            label = dat2*0.5
-            loss = F.l1_loss(dat2, label)
-            loss.backward()
-            optimizer.step()
-        print("  epoch :" + str(e))
-    return SearchLayer.weight.data.cpu().detach().numpy()
-
-def UnsuperLearnTrainWeight(model, layer, dataloader, NumTrain=500, TrainChannelRatio=1, Epoch=100):
-    tl = model.features[layer]
-    newlayer = nn.Conv2d(tl.in_channels, tl.out_channels * TrainChannelRatio, tl.kernel_size,
-                         tl.stride, tl.padding, tl.dilation, tl.groups, tl.bias, tl.padding_mode)
-    newlayer = utils.SetDevice(newlayer)
-
-    newweightshape = list(newlayer.weight.data.shape)
-    
-    minactive = np.empty((0))
-    minweight = np.empty([0,newweightshape[1],newweightshape[2],newweightshape[3]])
-    for i in range(NumTrain):
-        newweight = np.random.uniform(-1.0,1.0,newweightshape).astype("float32")
-        newlayer.weight.data=utils.SetDevice(torch.from_numpy(newweight))
-        newweight = TrainLayer(model, layer, newlayer, dataloader, 5)
-        minweight = np.concatenate((minweight, newweight))
-
-        ConvKernelToImage(minweight, CurrentPath+"image")
-
-        print("search :" + str(i))
-
-    return minweight
-
-
-weight = UnsuperLearnTrainWeight(model, layer, traindata)
-np.save("WeightTrain.npy", weight)
-
-# ConvKernelToImage(model, layer, CurrentPath+"image")
-# utils.SaveModel(model,CurrentPath+"/checkpoint.pkl")
-print("save model sucess")
--- a/FilterEvaluator/WeightTrain.npy
+++ b/FilterEvaluator/WeightTrain.npy
--- a/FilterEvaluator/image/0-1024.png
+++ b/FilterEvaluator/image/0-1024.png
--- a/FilterEvaluator/image/1024-2048.png
+++ b/FilterEvaluator/image/1024-2048.png
--- a/FilterEvaluator/image/2048-3072.png
+++ b/FilterEvaluator/image/2048-3072.png
--- a/FilterEvaluator/image/3072-4096.png
+++ b/FilterEvaluator/image/3072-4096.png
--- a/tools/utils.py
+++ b/tools/utils.py
@ -149,3 +149,43 @@ def SetCUDAVISIBLEDEVICES(deviceid):
    print("Use GPU IDs :" + str(tuple(deviceid))[1:-1])


+
+
+def ConvKernelToImage(model, layer, foldname):
+    if not os.path.exists(foldname):
+        os.mkdir(foldname)
+    a2 = model.features[layer].weight.data
+    a2 = a2.cpu().detach().numpy().reshape((-1, a2.shape[-2], a2.shape[-1]))
+    for i in range(a2.shape[0]):
+        d = a2[i]
+        dmin = np.min(d)
+        dmax = np.max(d)
+        d = (d - dmin)*255.0/(dmax-dmin)
+        d = d.astype(int)
+        cv2.imwrite(foldname+"/"+str(i)+".png", d)
+
+def NumpyToImage(numpydate, foldname ,maxImageWidth = 128,maxImageHeight = 128):
+    if not os.path.exists(foldname):
+        os.mkdir(foldname)
+    numpydatemin = np.min(numpydate)
+    numpydatemax = np.max(numpydate)
+    numpydate = (numpydate - numpydatemin)*255.0/(numpydatemax-numpydatemin)
+    data = numpydate.reshape((-1, numpydate.shape[-2], numpydate.shape[-1]))
+    datashape = data.shape
+
+    newdata = np.ones((datashape[0],datashape[1]+1,datashape[2]+1))*numpydatemin
+    newdata[:, 0:datashape[1], 0:datashape[2]]=data
+    datashape = newdata.shape
+    
+    imagecols = int(maxImageWidth/datashape[2])
+    imagerows = int(maxImageHeight/datashape[1])
+    stepimages = imagecols*imagerows
+    for i in range(0,datashape[0],stepimages):
+        d = np.zeros((stepimages,datashape[1],datashape[2]))
+        left = newdata[i:min(i+stepimages,datashape[0])]
+        d[0:left.shape[0]]=left
+        d=np.reshape(d, (imagerows, imagecols, datashape[1], datashape[2]))
+        d=np.swapaxes(d, 1, 2)
+        d=np.reshape(d, (imagerows*datashape[1],imagecols*datashape[2]))
+        d = d.astype(int)
+        cv2.imwrite(foldname+"/"+str(i)+"-"+str(i+stepimages)+".png", d)
--- a/0
+++ b/0