1. Model Download

import re
import os
import glob
import torch
from torch.hub import download_url_to_file
from urllib.parse import urlparse
import torchvision.models as models

def download_model(url, dst_path):
    parts = urlparse(url)
    filename = os.path.basename(parts.path)
    HASH_REGEX = re.compile(r'-([a-f0-9]*)\.')
    hash_prefix = HASH_REGEX.search(filename).group(1)
    if os.path.exists(os.path.join(dst_path, filename)):
        return filename
    download_url_to_file(url, os.path.join(dst_path, filename), hash_prefix, True)
    return filename

def saveToFolder(path):
    # URLs for the other models can be looked up under
    # https://github.com/pytorch/vision/tree/master/torchvision/models
    # model_urls = {
    #     'vgg11': 'https://download.pytorch.org/models/vgg11-bbd30ac9.pth',
    #     'vgg13': 'https://download.pytorch.org/models/vgg13-c768596a.pth',
    #     'vgg16': 'https://download.pytorch.org/models/vgg16-397923af.pth',
    #     'vgg19': 'https://download.pytorch.org/models/vgg19-dcbb9e9d.pth',
    #     'vgg11_bn': 'https://download.pytorch.org/models/vgg11_bn-6002323d.pth',
    #     'vgg13_bn': 'https://download.pytorch.org/models/vgg13_bn-abd245e5.pth',
    #     'vgg16_bn': 'https://download.pytorch.org/models/vgg16_bn-6c64b313.pth',
    #     'vgg19_bn': 'https://download.pytorch.org/models/vgg19_bn-c79401a0.pth',
    # }
    model_urls = {
        'vgg16': 'https://download.pytorch.org/models/vgg16-397923af.pth',
    }
    if not os.path.exists(path):
        os.makedirs(path)
    for url in model_urls.values():
        download_model(url, path)

def load_model(model_name, model_dir):
    model = eval('models.%s(init_weights=False)' % model_name)
    path_format = os.path.join(model_dir, '%s-[a-z0-9]*.pth' % model_name)
    model_path = glob.glob(path_format)[0]
    model.load_state_dict(torch.load(model_path))
    return model

def main():
    path = '/home/iot/jupyter/root_dir/liudongdong/pytorch_demo/pretainedpth/vgg16'
    saveToFolder(path)
    model = load_model('vgg16', path)
    print(model)

if __name__ == "__main__":
    main()
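For comparison, recent PyTorch releases expose the same download-and-cache logic through torch.hub.load_state_dict_from_url, so the manual helper above can often be replaced by a few lines. A minimal sketch (the cache directory is an arbitrary example):

import torch
import torchvision.models as models

# Downloads the file to model_dir (unless already cached) and returns the state dict;
# pass check_hash=True if you want the hash suffix in the file name to be verified.
state_dict = torch.hub.load_state_dict_from_url(
    'https://download.pytorch.org/models/vgg16-397923af.pth',
    model_dir='./pretrainedpth/vgg16', progress=True)
vgg16 = models.vgg16(init_weights=False)
vgg16.load_state_dict(state_dict)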

2. Model Inspection

import torch
import torchvision.models as models

resnet = models.resnet18(pretrained=True)  # any ResNet variant works here
resnet.fc = torch.nn.Linear(resnet.fc.in_features, 100)
print(resnet)  # prints the structure of every layer in the network

# Alternatively, visualize the structure with the torchviz module, which generates a PDF of the graph
from torchviz import make_dot
x = torch.randn(10, 3, 224, 224).requires_grad_(True)
y = resnet(x)
vis_graph = make_dot(y, params=dict(list(resnet.named_parameters()) + [('x', x)]))
vis_graph.view()
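If a per-layer summary with output shapes and parameter counts is preferred, the third-party torchsummary package (assuming it is installed) offers a Keras-style view:

from torchsummary import summary
summary(resnet, input_size=(3, 224, 224), device='cpu')  # prints layers, output shapes and parameter counts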

3. 模型初始化

Proper weight initialization speeds up training and convergence, while poor initialization leads to vanishing or exploding gradients and the network fails to train; the scale of each layer's outputs therefore has to be kept under control. torch.nn.init provides the commonly used initialization functions: 1. the Xavier and Kaiming families; 2. other distribution-based methods.

For a linear layer with n inputs, every propagation through a layer multiplies the variance of the output by a factor of n. To control the scale of the output H it suffices to keep its variance at 1; then no matter how many layers the signal passes through, it stays near the variance of the initial input X. The weights w therefore need to be initialized with variance 1/n (n being the number of neurons feeding the layer).
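A minimal derivation of this claim, assuming zero-mean, mutually independent weights and inputs: for one linear layer H_j = Σ_i W_ij · X_i with n inputs,

D(H_j) = Σ_i D(W_ij) · D(X_i) = n · D(W) · D(X)

so keeping D(H) = D(X) requires D(W) = 1/n. Xavier initialization balances the forward and backward passes by using both fan counts, giving D(W) = 2 / (fan_in + fan_out), which is exactly the variance behind the uniform and normal variants below.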

.1. Xavier uniform distribution

import os
import torch
import random
import numpy as np
import torch.nn as nn

def set_seed(seed=1):
    random.seed(seed)
    np.random.seed(seed)
    torch.manual_seed(seed)
    torch.cuda.manual_seed(seed)

set_seed(1)  # set the random seed

class MLP(nn.Module):
    def __init__(self, neural_num, layers):
        super(MLP, self).__init__()
        self.linears = nn.ModuleList([nn.Linear(neural_num, neural_num, bias=False) for i in range(layers)])
        self.neural_num = neural_num

    def forward(self, x):
        for (i, linear) in enumerate(self.linears):
            x = linear(x)
            x = torch.tanh(x)
            print("layer:{}, std:{}".format(i, x.std()))
            if torch.isnan(x.std()):
                print("output is nan in {} layers".format(i))
                break
        return x

    def initialize(self):
        for m in self.modules():
            if isinstance(m, nn.Linear):
                # Xavier computed by hand
                a = np.sqrt(6 / (self.neural_num + self.neural_num))
                tanh_gain = nn.init.calculate_gain('tanh')  # compute the gain
                a *= tanh_gain
                nn.init.uniform_(m.weight.data, -a, a)
                # Built-in Xavier initialization (suited to saturating activations):
                # tanh_gain = nn.init.calculate_gain('tanh')
                # nn.init.xavier_uniform_(m.weight.data, gain=tanh_gain)

# flag = 0
flag = 1
if flag:
    layer_nums = 100
    neural_nums = 256
    batch_size = 16

    net = MLP(neural_nums, layer_nums)
    net.initialize()

    inputs = torch.randn((batch_size, neural_nums))  # normal: mean=0, std=1
    output = net(inputs)
    print(output)

torch.nn.init.xavier_uniform_(tensor, gain=1)

Xavier initialization draws values from a uniform distribution U(−a, a) with a = gain * sqrt(6 / (fan_in + fan_out)).

The gain factor is chosen according to the activation function, e.g.:

nn.init.xavier_uniform_(w, gain=nn.init.calculate_gain('relu'))
.2. Xavier normal distribution

torch.nn.init.xavier_normal_(tensor, gain=1)

Xavier normal initialization draws values from a normal distribution with mean = 0 and std = gain * sqrt(2 / (fan_in + fan_out)).
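A quick numerical sanity check of this formula (illustrative only; the 256×256 size is arbitrary): the empirical standard deviation of a freshly initialized weight matrix should be close to gain * sqrt(2 / (fan_in + fan_out)).

import torch
import torch.nn as nn

w = torch.empty(256, 256)                      # fan_in = fan_out = 256
gain = nn.init.calculate_gain('tanh')
nn.init.xavier_normal_(w, gain=gain)
expected_std = gain * (2.0 / (256 + 256)) ** 0.5
print(w.std().item(), expected_std)            # the two values should roughly agree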

.3. Kaiming uniform distribution

torch.nn.init.kaiming_uniform_(tensor, a=0, mode='fan_in', nonlinearity='leaky_relu')

This is a uniform distribution U(−bound, bound) with bound = sqrt(6 / ((1 + a^2) * fan_in)).

Here a is the slope of the activation function on its negative half-axis (0 for ReLU).

mode: either 'fan_in' or 'fan_out'; 'fan_in' keeps the variance consistent in the forward pass, 'fan_out' keeps it consistent in the backward pass.

nonlinearity: either 'relu' or 'leaky_relu'; the default is 'leaky_relu'.

nn.init.kaiming_uniform_(w, mode='fan_in', nonlinearity='relu')

import os
import torch
import random
import numpy as np
import torch.nn as nn

def set_seed(seed=1):
    random.seed(seed)
    np.random.seed(seed)
    torch.manual_seed(seed)
    torch.cuda.manual_seed(seed)

set_seed(1)  # set the random seed

class MLP(nn.Module):
    def __init__(self, neural_num, layers):
        super(MLP, self).__init__()
        self.linears = nn.ModuleList([nn.Linear(neural_num, neural_num, bias=False) for i in range(layers)])
        self.neural_num = neural_num

    def forward(self, x):
        for (i, linear) in enumerate(self.linears):
            x = linear(x)
            x = torch.relu(x)
            print("layer:{}, std:{}".format(i, x.std()))
            if torch.isnan(x.std()):
                print("output is nan in {} layers".format(i))
                break
        return x

    def initialize(self):
        for m in self.modules():
            if isinstance(m, nn.Linear):
                # Kaiming initialization computed by hand
                nn.init.normal_(m.weight.data, std=np.sqrt(2 / self.neural_num))
                # Built-in Kaiming initialization:
                # nn.init.kaiming_normal_(m.weight.data)

# flag = 0
flag = 1
if flag:
    layer_nums = 100
    neural_nums = 256
    batch_size = 16

    net = MLP(neural_nums, layer_nums)
    net.initialize()

    inputs = torch.randn((batch_size, neural_nums))  # normal: mean=0, std=1
    output = net(inputs)
    print(output)
.4. Kaiming normal distribution

torch.nn.init.kaiming_normal_(tensor, a=0, mode='fan_in', nonlinearity='leaky_relu')

This is a zero-mean normal distribution N(0, std) with std = sqrt(2 / ((1 + a^2) * fan_in)).

Here a is the slope of the activation function on its negative half-axis (0 for ReLU).

mode: either 'fan_in' or 'fan_out'; 'fan_in' keeps the variance consistent in the forward pass, 'fan_out' keeps it consistent in the backward pass.

nonlinearity: either 'relu' or 'leaky_relu'; the default is 'leaky_relu'.

nn.init.kaiming_normal_(w, mode='fan_out', nonlinearity='relu')

.5. Uniform initialization

torch.nn.init.uniform_(tensor, a=0, b=1)

Fills the tensor with values drawn from the uniform distribution U(a, b).

.6. Normal initialization

torch.nn.init.normal_(tensor, mean=0, std=1)

Fills the tensor with values drawn from the normal distribution N(mean, std); the defaults are mean=0, std=1.

.7. Constant initialization

torch.nn.init.constant_(tensor, val)

Fills the tensor with the constant val, e.g. nn.init.constant_(w, 0.3).

.8. Identity initialization

torch.nn.init.eye_(tensor)

Initializes a 2D tensor as the identity matrix.

.9. Orthogonal initialization

torch.nn.init.orthogonal_(tensor, gain=1)

Initializes the tensor to be orthogonal; see "Exact solutions to the nonlinear dynamics of learning in deep linear neural networks", Saxe, A. et al. (2013).

.10. Sparse initialization

torch.nn.init.sparse_(tensor, sparsity, std=0.01)

Fills the tensor from the normal distribution N(0, std) while setting part of each column to zero.

sparsity: the fraction of elements in each column that are set to zero.

nn.init.sparse_(w, sparsity=0.1)

Note the difference between model.modules() and model.children(): model.modules() recursively iterates over all submodules of the model, while model.children() only iterates over the model's immediate children.
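A small sketch of that difference on a toy nested module (names are illustrative):

import torch.nn as nn

net = nn.Sequential(nn.Sequential(nn.Conv2d(3, 8, 3), nn.ReLU()), nn.Linear(8, 2))
# modules() recurses into every submodule, including the top-level container itself
print([type(m).__name__ for m in net.modules()])   # ['Sequential', 'Sequential', 'Conv2d', 'ReLU', 'Linear']
# children() only yields the immediate children
print([type(m).__name__ for m in net.children()])  # ['Sequential', 'Linear']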

  • Initializing a single layer of the network
self.conv1 = nn.Conv2d(3, 64, kernel_size=7, stride=2, padding=3)
init.xavier_uniform_(self.conv1.weight)
init.constant_(self.conv1.bias, 0.1)
  • Initializing the whole network
def weights_init(m):
    classname = m.__class__.__name__
    if classname.find('Conv') != -1:
        # Xavier init for the weights; biases are 1-D, so they get a constant init instead
        nn.init.xavier_uniform_(m.weight.data)
        nn.init.constant_(m.bias.data, 0.0)

net = Net()  # build the network
# apply() recursively walks every module inside the network and applies the given
# function to each of them, so all Conv layers get their weights initialized.
net.apply(weights_init)
  • Weight initialization (common practice)
# Common practice for initialization.
for layer in model.modules():
    if isinstance(layer, torch.nn.Conv2d):
        torch.nn.init.kaiming_normal_(layer.weight, mode='fan_out', nonlinearity='relu')
        if layer.bias is not None:
            torch.nn.init.constant_(layer.bias, val=0.0)
    elif isinstance(layer, torch.nn.BatchNorm2d):
        torch.nn.init.constant_(layer.weight, val=1.0)
        torch.nn.init.constant_(layer.bias, val=0.0)
    elif isinstance(layer, torch.nn.Linear):
        torch.nn.init.xavier_normal_(layer.weight)
        if layer.bias is not None:
            torch.nn.init.constant_(layer.bias, val=0.0)

# Initialization with a given tensor.
layer.weight = torch.nn.Parameter(tensor)
  • Fine-tuning only specified layers
count = 0
para_optim = []
for k in model.children():
    count += 1
    # 6 should be changed properly
    if count > 6:
        for param in k.parameters():
            para_optim.append(param)
    else:
        for param in k.parameters():
            param.requires_grad = False

optimizer = optim.RMSprop(para_optim, lr)
  • Training with part of the parameters frozen
# only parameters with requires_grad=True are passed to the optimizer
optimizer = optim.SGD(filter(lambda p: p.requires_grad, model.parameters()), lr=1e-3)

class Net(nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.conv1 = nn.Conv2d(1, 6, 5)
        self.conv2 = nn.Conv2d(6, 16, 5)
        # the parameters defined above are frozen; the ones defined below stay trainable
        for p in self.parameters():
            p.requires_grad = False
        self.fc1 = nn.Linear(16 * 5 * 5, 120)
        self.fc2 = nn.Linear(120, 84)
        self.fc3 = nn.Linear(84, 10)
  • Optimizer with separate parameter groups
optimizer = optim.Adam([
    {'params': [param for name, param in net.named_parameters() if name[-4:] == 'bias'],
     'lr': 2 * args['lr']},
    {'params': [param for name, param in net.named_parameters() if name[-4:] != 'bias'],
     'lr': args['lr'], 'weight_decay': args['weight_decay']}
], betas=(args['momentum'], 0.999))
  • Loading partial weights
# collect the keys of the model's state dict
keys = []
for k, v in desnet.state_dict().items():
    if v.shape:
        keys.append(k)
    print(k, v.shape)

# load weights from the pretrained file
state = {}
pretrained_dict = torch.load('/home/lulu/pytorch/Paper_Code/weights/densenet121-a639ec97.pth')
for i, (k, v) in enumerate(pretrained_dict.items()):
    if 'classifier' not in k:
        state[keys[i]] = v

# save the filtered weights
torch.save(state, '/home/lulu/pytorch/Paper_Code/weights/densenet121.pth')

4. Building Models

  • Sequential: sequential; layers are executed strictly in order, commonly used to build blocks
  • ModuleList: iterable; commonly used to build many repeated layers with a for loop
  • ModuleDict: indexable; commonly used for selectable layers
.1. nn.Sequential
# ============================ Sequential
class LeNetSequential(nn.Module):
    def __init__(self, classes):
        super(LeNetSequential, self).__init__()
        self.features = nn.Sequential(
            nn.Conv2d(3, 6, 5),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2),
            nn.Conv2d(6, 16, 5),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2),)

        self.classifier = nn.Sequential(
            nn.Linear(16*5*5, 120),
            nn.ReLU(),
            nn.Linear(120, 84),
            nn.ReLU(),
            nn.Linear(84, classes),)

    def forward(self, x):
        x = self.features(x)
        x = x.view(x.size()[0], -1)
        x = self.classifier(x)
        return x
.2. nn.ModuleList

Purpose: wraps multiple layers like a Python list, so they can be called iteratively.

  • append(): add a layer at the end of the ModuleList
  • extend(): concatenate two ModuleLists
  • insert(): insert a layer at a given position in the ModuleList (see the sketch after the class below)
class ModuleList(nn.Module):
    def __init__(self):
        super(ModuleList, self).__init__()
        self.linears = nn.ModuleList([nn.Linear(10, 10) for i in range(20)])

    def forward(self, x):
        for i, linear in enumerate(self.linears):
            x = linear(x)
        return x

net = ModuleList()
print(net)
fake_data = torch.ones((10, 10))
output = net(fake_data)
print(output)
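Continuing from the net object above, a short sketch of the three list-style operations just listed:

extra = nn.ModuleList([nn.Linear(10, 10)])
net.linears.append(nn.Linear(10, 10))     # append(): add one layer at the end
net.linears.extend(extra)                 # extend(): concatenate another ModuleList
net.linears.insert(0, nn.Linear(10, 10))  # insert(): insert a layer at position 0
print(len(net.linears))                   # 20 original layers + 3 new ones = 23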
.3. nn.ModuleDict

Purpose: wraps multiple layers like a Python dict (each layer gets a key and can be looked up by it).

  • clear(): empty the ModuleDict
  • items(): return an iterable of key-value pairs
  • keys(): return the dict's keys
  • values(): return the dict's values
  • pop(): return a key-value pair and remove it from the dict (some of these are sketched after the example below)
# ============================ ModuleDict
class ModuleDict(nn.Module):
    def __init__(self):
        super(ModuleDict, self).__init__()
        self.choices = nn.ModuleDict({
            'conv': nn.Conv2d(10, 10, 3),
            'pool': nn.MaxPool2d(3)
        })
        self.activations = nn.ModuleDict({
            'relu': nn.ReLU(),
            'prelu': nn.PReLU()
        })

    def forward(self, x, choice, act):
        x = self.choices[choice](x)
        x = self.activations[act](x)
        return x

net = ModuleDict()
fake_img = torch.randn((4, 10, 32, 32))
output = net(fake_img, 'conv', 'relu')
# prelu can output negative values; with relu the output has no negatives,
# which makes it easy to check that the chosen branch really ran
print(output)
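Continuing from the net object above, a brief sketch of the dict-style operations just listed (the added 'flatten' key is only an illustration):

print(list(net.choices.keys()))          # keys(): ['conv', 'pool']
for name, layer in net.activations.items():
    print(name, layer)                   # items(): iterate over key-value pairs
net.choices['flatten'] = nn.Flatten()    # add a new layer under a new key
pooled = net.choices.pop('pool')         # pop(): remove and return the layer stored under 'pool'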

5. Using Pretrained Models

.0. Modifying a pretrained AlexNet

1. Using AlexNet directly, with feature-map visualization
import os
import torch
import torch.nn
import torchvision.models as models
import torchvision.transforms as transforms
import torch.nn.functional as F
import torchvision.utils as utils
import cv2
import matplotlib.pyplot as plt
import numpy as np
from PIL import Image
import argparse

"""input commands"""
paser = argparse.ArgumentParser()
paser.add_argument("--test_img", type=str, default='whippet.jpg', help="testing image")
opt = paser.parse_args()

# function for visualizing the feature maps
def visualize_activation_maps(input, model):
    I = utils.make_grid(input, nrow=1, normalize=True, scale_each=True)
    img = I.permute((1, 2, 0)).cpu().numpy()
    conv_results = []
    x = input
    for idx, operation in enumerate(model.features):
        x = operation(x)
        if idx in {1, 4, 7, 9, 11}:
            conv_results.append(x)
    for i in range(5):
        conv_result = conv_results[i]
        N, C, H, W = conv_result.size()
        mean_acti_map = torch.mean(conv_result, 1, True)
        mean_acti_map = F.interpolate(mean_acti_map, size=[224, 224], mode='bilinear', align_corners=False)
        map_grid = utils.make_grid(mean_acti_map, nrow=1, normalize=True, scale_each=True)
        map_grid = map_grid.permute((1, 2, 0)).mul(255).byte().cpu().numpy()
        map_grid = cv2.applyColorMap(map_grid, cv2.COLORMAP_JET)
        map_grid = cv2.cvtColor(map_grid, cv2.COLOR_BGR2RGB)
        map_grid = np.float32(map_grid) / 255
        visual_acti_map = 0.6 * img + 0.4 * map_grid
        tensor_visual_acti_map = torch.from_numpy(visual_acti_map).permute(2, 0, 1)
        file_name_visual_acti_map = 'conv{}_activation_map.jpg'.format(i + 1)
        utils.save_image(tensor_visual_acti_map, file_name_visual_acti_map)
    return 0

# main
if __name__ == "__main__":
    """
    data transforms, for pre-processing the input testing image before feeding into the net
    """
    data_transforms = transforms.Compose([
        transforms.Resize((224, 224)),       # resize the input to 224x224
        transforms.ToTensor(),               # put the input to tensor format
        transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])  # normalize the input
        # the normalization is based on images from ImageNet
    ])
    # obtain the file path of the testing image
    test_image_dir = './alexnet_images'
    test_image_filepath = os.path.join(test_image_dir, opt.test_img)
    # print(test_image_filepath)
    # open the testing image
    img = Image.open(test_image_filepath)
    print("original image's shape: " + str(img.size))
    # pre-process the input
    transformed_img = data_transforms(img)
    print("transformed image's shape: " + str(transformed_img.shape))
    # form a batch with only one image
    batch_img = torch.unsqueeze(transformed_img, 0)  # returns a new tensor with a dimension of size one inserted at the specified position
    print("image batch's shape: " + str(batch_img.shape))
    # load pre-trained AlexNet model
    print("\nfeed the input into the pre-trained alexnet to get the output")
    alexnet = models.alexnet(pretrained=True)
    # put the model to eval mode for testing
    alexnet.eval()
    # obtain the output of the model
    output = alexnet(batch_img)
    print("output vector's shape: " + str(output.shape))
    # obtain the activation maps
    visualize_activation_maps(batch_img, alexnet)
    # map the class no. to the corresponding label
    with open('class_names_ImageNet.txt') as labels:
        classes = [i.strip() for i in labels.readlines()]
    # print the first 5 classes to see the labels
    print("\nprint the first 5 classes to see the labels")
    for i in range(5):
        print("class " + str(i) + ": " + str(classes[i]))
    # sort the probability vector in descending order
    sorted, indices = torch.sort(output, descending=True)
    percentage = F.softmax(output, dim=1)[0] * 100.0
    # obtain the first 5 classes (with the highest probability) the input belongs to
    results = [(classes[i], percentage[i].item()) for i in indices[0][:5]]
    print("\nprint the first 5 classes the testing image belongs to")
    for i in range(5):
        print('{}: {:.4f}%'.format(results[i][0], results[i][1]))
2. Modifying the last layer of AlexNet
import torch.nn as nn
import torchvision.models as models

model = models.AlexNet()
print(model)
# change the first conv layer to accept 4-channel input, and the last classifier layer to predict 10 classes
model.features[0] = nn.Conv2d(4, 64, kernel_size=(11, 11), stride=(4, 4), padding=(2, 2))
model.classifier[6] = nn.Linear(4096, 10)
print(model)
model = cifar10_cnn.CIFAR10_Nettest()
pretrained_dict = torch.load('models/cifar10_statedict.pkl')
model_dict = model.state_dict()
pretrained_dict = {k: v for k, v in pretrained_dict.items() if k in model_dict}
model_dict.update(pretrained_dict)
model.load_state_dict(model_dict)
print(model)

new_model_dict = model.state_dict()
dict_name = list(new_model_dict)
for i, p in enumerate(dict_name):
    print(i, p)

print('before change:\n', new_model_dict['classifier.5.bias'])
model.classifier[5] = nn.Linear(1024, 17)
change_model_dict = model.state_dict()
new_dict_name = list(change_model_dict)
print('after change:\n', change_model_dict['classifier.5.bias'])

import torch.nn as nn
from torchvision import models

class BuildAlexNet(nn.Module):
    def __init__(self, model_type, n_output):
        super(BuildAlexNet, self).__init__()
        self.model_type = model_type
        if model_type == 'pre':
            model = models.alexnet(pretrained=True)
            self.features = model.features
            fc1 = nn.Linear(9216, 4096)
            fc1.bias = model.classifier[1].bias
            fc1.weight = model.classifier[1].weight

            fc2 = nn.Linear(4096, 4096)
            fc2.bias = model.classifier[4].bias
            fc2.weight = model.classifier[4].weight

            self.classifier = nn.Sequential(
                nn.Dropout(),
                fc1,
                nn.ReLU(inplace=True),
                nn.Dropout(),
                fc2,
                nn.ReLU(inplace=True),
                nn.Linear(4096, n_output))
            # Alternative: reuse the original classifier and only swap the last layer
            # model.classifier[6] = nn.Linear(4096, n_output)
            # self.classifier = model.classifier
        if model_type == 'new':
            self.features = nn.Sequential(
                nn.Conv2d(3, 64, 11, 4, 2),
                nn.ReLU(inplace=True),
                nn.MaxPool2d(3, 2, 0),
                nn.Conv2d(64, 192, 5, 1, 2),
                nn.ReLU(inplace=True),
                nn.MaxPool2d(3, 2, 0),
                nn.Conv2d(192, 384, 3, 1, 1),
                nn.ReLU(inplace=True),
                nn.Conv2d(384, 256, 3, 1, 1),
                nn.ReLU(inplace=True),
                nn.MaxPool2d(3, 2, 0))
            self.classifier = nn.Sequential(
                nn.Dropout(),
                nn.Linear(9216, 4096),
                nn.ReLU(inplace=True),
                nn.Dropout(),
                nn.Linear(4096, 4096),
                nn.ReLU(inplace=True),
                nn.Linear(4096, n_output))

    def forward(self, x):
        x = self.features(x)
        x = x.view(x.size(0), -1)
        out = self.classifier(x)
        return out

import numpy as np
from torch.autograd import Variable
import torch

if __name__ == '__main__':
    model_type = 'pre'
    n_output = 10
    alexnet = BuildAlexNet(model_type, n_output)
    print(alexnet)

    x = np.random.rand(1, 3, 224, 224)
    x = x.astype(np.float32)
    x_ts = torch.from_numpy(x)
    x_in = Variable(x_ts)
    y = alexnet(x_in)

.1. Modifying ResNet parameters

The final classification layer fc of a ResNet separates 1000 classes; for your own dataset with, say, only 9 classes, replace it as follows:

# coding=UTF-8
import torchvision.models as models
import torch.nn as nn

# load the model
model = models.resnet50(pretrained=True)
# read the input dimension of the existing fc layer
fc_features = model.fc.in_features
# change the number of output classes to 9
model.fc = nn.Linear(fc_features, 9)

.2. Adding or removing convolutional layers

1. First build your own network (similar to the pretrained model, otherwise there is nothing to fine-tune).

2. Then drop the parameters of the pretrained model that do not match your own network.

3. Load the remaining, matching parameters into the network as its initialization, which gives the fine-tuning effect.

# -*- coding:utf-8 -*-
###################### first build your own network `net` ######################
# Then read in the pretrained parameters; resnet152 is used here as an example,
# loaded from a local file (save_path) instead of being downloaded in code.
pretrained_dict = torch.load(save_path)
model_dict = net.state_dict()   # parameters of the network you built, to be updated and then loaded back
# drop the keys that do not belong to model_dict
pretrained_dict = {k: v for k, v in pretrained_dict.items() if k in model_dict}
# update the values in the existing model_dict
model_dict.update(pretrained_dict)
# load the parameters the model needs
net.load_state_dict(model_dict)

.3. Computing multi-layer convolutional features with an ImageNet model

class FeatureExtractor(torch.nn.Module):
    """Helper class to extract several convolution features from the given
    pre-trained model.

    Attributes:
        _model, torch.nn.Module.
        _layers_to_extract, list<str> or set<str>

    Example:
        >>> model = torchvision.models.resnet152(pretrained=True)
        >>> model = torch.nn.Sequential(collections.OrderedDict(
                list(model.named_children())[:-1]))
        >>> conv_representation = FeatureExtractor(
                pretrained_model=model,
                layers_to_extract={'layer1', 'layer2', 'layer3', 'layer4'})(image)
    """
    def __init__(self, pretrained_model, layers_to_extract):
        torch.nn.Module.__init__(self)
        self._model = pretrained_model
        self._model.eval()
        self._layers_to_extract = set(layers_to_extract)

    def forward(self, x):
        with torch.no_grad():
            conv_representation = []
            for name, layer in self._model.named_children():
                x = layer(x)
                if name in self._layers_to_extract:
                    conv_representation.append(x)
            return conv_representation

.4. Training specific layers and freezing the others

Keep the weights of some of the initial layers fixed and retrain the later layers to obtain new weights. This can be tried several times to find the best split between frozen layers and retrained layers based on the results. How a pretrained model should be used depends on the size of the dataset and on the similarity between the old data (used for pretraining) and the new data (your own task).

  • set requires_grad to False to freeze network parameters
  • use filter(lambda p: p.requires_grad, model.parameters()) to filter out the layers with requires_grad=False (a quick check is sketched below)
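A quick sketch for verifying the split before building the optimizer (assuming model is the network being fine-tuned):

trainable = [n for n, p in model.named_parameters() if p.requires_grad]
frozen = [n for n, p in model.named_parameters() if not p.requires_grad]
print(len(trainable), 'trainable parameter tensors /', len(frozen), 'frozen')
optimizer = torch.optim.SGD(filter(lambda p: p.requires_grad, model.parameters()), lr=1e-3)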

# First define your own network
import math
import torch.nn as nn
import torchvision.models as models
from torchvision.models.resnet import Bottleneck

class CNN(nn.Module):
    def __init__(self, block, layers, num_classes=9):
        # The new CNN keeps the same layer names as torchvision's ResNet so that the
        # pretrained weights can be copied in; only the layers added below are new.
        self.inplanes = 64
        super(CNN, self).__init__()
        self.conv1 = nn.Conv2d(3, 64, kernel_size=7, stride=2, padding=3, bias=False)
        self.bn1 = nn.BatchNorm2d(64)
        self.relu = nn.ReLU(inplace=True)
        self.maxpool = nn.MaxPool2d(kernel_size=3, stride=2, padding=1)
        self.layer1 = self._make_layer(block, 64, layers[0])
        self.layer2 = self._make_layer(block, 128, layers[1], stride=2)
        self.layer3 = self._make_layer(block, 256, layers[2], stride=2)
        self.layer4 = self._make_layer(block, 512, layers[3], stride=2)
        self.avgpool = nn.AvgPool2d(7, stride=1)
        # newly added transposed-convolution layer
        self.convtranspose1 = nn.ConvTranspose2d(2048, 2048, kernel_size=3, stride=1, padding=1,
                                                 output_padding=0, groups=1, bias=False, dilation=1)
        # newly added max-pooling layer
        self.maxpool2 = nn.MaxPool2d(kernel_size=3, stride=1, padding=1)
        # replace the original fc layer (self.fc = nn.Linear(512 * block.expansion, num_classes)) with fclass
        self.fclass = nn.Linear(2048, num_classes)
        for m in self.modules():
            if isinstance(m, nn.Conv2d):
                n = m.kernel_size[0] * m.kernel_size[1] * m.out_channels
                m.weight.data.normal_(0, math.sqrt(2. / n))
            elif isinstance(m, nn.BatchNorm2d):
                m.weight.data.fill_(1)
                m.bias.data.zero_()

    def _make_layer(self, block, planes, blocks, stride=1):
        downsample = None
        if stride != 1 or self.inplanes != planes * block.expansion:
            downsample = nn.Sequential(
                nn.Conv2d(self.inplanes, planes * block.expansion,
                          kernel_size=1, stride=stride, bias=False),
                nn.BatchNorm2d(planes * block.expansion),
            )
        layers = []
        layers.append(block(self.inplanes, planes, stride, downsample))
        self.inplanes = planes * block.expansion
        for i in range(1, blocks):
            layers.append(block(self.inplanes, planes))
        return nn.Sequential(*layers)

    def forward(self, x):
        x = self.conv1(x)
        x = self.bn1(x)
        x = self.relu(x)
        x = self.maxpool(x)
        x = self.layer1(x)
        x = self.layer2(x)
        x = self.layer3(x)
        x = self.layer4(x)
        x = self.avgpool(x)
        # forward pass of the 3 newly added layers; convtranspose1 expects a 4D input
        # with 2048 channels, so the tensor is flattened only right before fclass
        x = self.convtranspose1(x)
        x = self.maxpool2(x)
        x = x.view(x.size(0), -1)
        # fclass expects 2048 input features
        x = self.fclass(x)
        return x

# load the pretrained model and create an instance of the newly defined network
resnet50 = models.resnet50(pretrained=True)
cnn = CNN(Bottleneck, [3, 4, 6, 3])
# fine-tune only the fully connected layer
import torch
import torchvision
import torch.nn as nn

model = torchvision.models.resnet18(pretrained=True)
for param in model.parameters():
    param.requires_grad = False
model.fc = nn.Linear(512, 100)  # replace the last fc layer
optimizer = torch.optim.SGD(model.fc.parameters(), lr=1e-2, momentum=0.9, weight_decay=1e-4)

# fine-tune the fc layer with a larger learning rate and the convolutional layers with a smaller one
model = torchvision.models.resnet18(pretrained=True)
finetuned_parameters = list(map(id, model.fc.parameters()))
conv_parameters = (p for p in model.parameters() if id(p) not in finetuned_parameters)
parameters = [{'params': conv_parameters, 'lr': 1e-3},
              {'params': model.fc.parameters()}]
optimizer = torch.optim.SGD(parameters, lr=1e-2, momentum=0.9, weight_decay=1e-4)

.5. Using keypointrcnn_resnet50_fpn

import torch
import torchvision
import torch.nn as nn

def get_model(num_kpts, train_kptHead=False, train_fpn=True):
    is_available = torch.cuda.is_available()
    device = torch.device('cuda:0' if is_available else 'cpu')
    dtype = torch.cuda.FloatTensor if is_available else torch.FloatTensor
    model = torchvision.models.detection.keypointrcnn_resnet50_fpn(pretrained=True)

    for i, param in enumerate(model.parameters()):
        param.requires_grad = False

    if train_kptHead != False:
        for i, param in enumerate(model.roi_heads.keypoint_head.parameters()):
            if i / 2 >= model.roi_heads.keypoint_head.__len__() / 2 - train_kptHead:
                param.requires_grad = True

    if train_fpn == True:
        for param in model.backbone.fpn.parameters():
            param.requires_grad = True

    out = nn.ConvTranspose2d(512, num_kpts, kernel_size=(4, 4), stride=(2, 2), padding=(1, 1))
    model.roi_heads.keypoint_predictor.kps_score_lowres = out

    return model, device, dtype

# model, device, dtype = get_model(2)
