caffe中的BatchNorm层

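在训练一个小的分类网络时，发现在每个卷积层之后加上BatchNorm层（同时去掉原来pool1、pool2之后的LRN层）后，检索效果相对于之前有所提升，因此将添加前后的网络结构记录在这里，供以后查阅使用。（注：下面的配置在转载过程中丢失了部分整数参数值，如 num_output、kernel_size、stride 等，使用前需按自己的网络补全。）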

添加该层之前：

 layer {

   name: "conv1"

   type: "Convolution"

   bottom: "data"

   top: "conv1"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   convolution_param {

     num_output:

     kernel_size:

     stride:

     weight_filler {

       type: "gaussian"

       std: 0.01

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 layer {

   name: "relu1"

   type: "ReLU"

   bottom: "conv1"

   top: "conv1"

 }

 layer {

   name: "pool1"

   type: "Pooling"

   bottom: "conv1"

   top: "pool1"

   pooling_param {

     pool: MAX

     kernel_size:

     stride:

   }

 }

 layer {

   name: "norm1"

   type: "LRN"

   bottom: "pool1"

   top: "norm1"

   lrn_param {

     local_size:

     alpha: 0.0001

     beta: 0.75

   }

 }

 layer {

   name: "conv2"

   type: "Convolution"

   bottom: "norm1"

   top: "conv2"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   convolution_param {

     num_output:

     pad:

     kernel_size:

     stride:

     group:

     weight_filler {

       type: "gaussian"

       std: 0.01

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 layer {

   name: "relu2"

   type: "ReLU"

   bottom: "conv2"

   top: "conv2"

 }

 layer {

   name: "pool2"

   type: "Pooling"

   bottom: "conv2"

   top: "pool2"

   pooling_param {

     pool: MAX

     kernel_size:

     stride:

   }

 }

 layer {

   name: "norm2"

   type: "LRN"

   bottom: "pool2"

   top: "norm2"

   lrn_param {

     local_size:

     alpha: 0.0001

     beta: 0.75

   }

 }

 layer {

   name: "conv3"

   type: "Convolution"

   bottom: "norm2"

   top: "conv3"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   convolution_param {

     num_output:

     pad:

     stride:

     kernel_size:

     weight_filler {

       type: "gaussian"

       std: 0.01

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 layer {

   name: "relu3"

   type: "ReLU"

   bottom: "conv3"

   top: "conv3"

 }

 layer {

   name: "conv4"

   type: "Convolution"

   bottom: "conv3"

   top: "conv4"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   convolution_param {

     num_output:

     pad:

     kernel_size:

     group:

     weight_filler {

       type: "gaussian"

       std: 0.01

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 layer {

   name: "relu4"

   type: "ReLU"

   bottom: "conv4"

   top: "conv4"

 }

 layer {

   name: "conv5"

   type: "Convolution"

   bottom: "conv4"

   top: "conv5"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   convolution_param {

     num_output:

     pad:

     stride:

     kernel_size:

     group:

     weight_filler {

       type: "gaussian"

       std: 0.01

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 layer {

   name: "relu5"

   type: "ReLU"

   bottom: "conv5"

   top: "conv5"

 }

 layer {

   name: "pool5"

   type: "Pooling"

   bottom: "conv5"

   top: "pool5"

   pooling_param {

     pool: MAX

     kernel_size:

     stride:

   }

 }

 layer {

   name: "fc6_srx"

   type: "InnerProduct"

   bottom: "pool5"

   top: "fc6"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   inner_product_param {

     num_output:

     weight_filler {

       type: "gaussian"

       std: 0.005

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 layer {

   name: "relu7"

   type: "ReLU"

   bottom: "fc6"

   top: "fc6"

 }

 layer {

   name: "drop7"

   type: "Dropout"

   bottom: "fc6"

   top: "fc6"

   dropout_param {

     dropout_ratio: 0.5

   }

 }

 layer {

   name: "fc7_srx"

   type: "InnerProduct"

   bottom: "fc6"

   top: "fc7"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   inner_product_param {

     num_output:

     weight_filler {

       type: "gaussian"

       std: 0.01

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 layer{

   name: "loss"

   type: "SoftmaxWithLoss"

   top: "SoftmaxWithLoss"

   bottom: "fc7"

   bottom: "label"

   include {

     phase: TRAIN

   }

 }

 layer {

   name: "accuracy"

   type: "Accuracy"

   bottom: "fc7"

   bottom: "label"

   top: "accuracy"

   include {

     phase: TEST

   }

 }

添加该层之后：

 layer {

   name: "conv1"

   type: "Convolution"

   bottom: "data"

   top: "conv1"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   convolution_param {

     num_output:

     kernel_size:

     stride:

     weight_filler {

       type: "gaussian"

       std: 0.01

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 ##############

 layer {

   bottom: "conv1"

   top: "conv1"

   name: "bn1"

   type: "BatchNorm"

   # BatchNorm 的三个参数 blob（均值、方差、滑动平均系数）由前向统计更新，不参与梯度学习，因此 lr_mult 均为 0

   param {

     lr_mult: 0

   }

   param {

     lr_mult: 0

   }

   param {

     lr_mult: 0

   }

 }

 ##############

 layer {

   name: "relu1"

   type: "ReLU"

   bottom: "conv1"

   top: "conv1"

 }

 layer {

   name: "pool1"

   type: "Pooling"

   bottom: "conv1"

   top: "pool1"

   pooling_param {

     pool: MAX

     kernel_size:

     stride:

   }

 }

 layer {

   name: "conv2"

   type: "Convolution"

   bottom: "pool1"

   top: "conv2"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   convolution_param {

     num_output:

     pad:

     kernel_size:

     stride:

     group:

     weight_filler {

       type: "gaussian"

       std: 0.01

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 ##############

 layer {

   bottom: "conv2"

   top: "conv2"

   name: "bn2"

   type: "BatchNorm"

   param {

     lr_mult: 0

   }

   param {

     lr_mult: 0

   }

   param {

     lr_mult: 0

   }

 }

 ##############

 layer {

   name: "relu2"

   type: "ReLU"

   bottom: "conv2"

   top: "conv2"

 }

 layer {

   name: "pool2"

   type: "Pooling"

   bottom: "conv2"

   top: "pool2"

   pooling_param {

     pool: MAX

     kernel_size:

     stride:

   }

 }

 layer {

   name: "conv3"

   type: "Convolution"

   bottom: "pool2"

   top: "conv3"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   convolution_param {

     num_output:

     pad:

     stride:

     kernel_size:

     weight_filler {

       type: "gaussian"

       std: 0.01

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 ##############

 layer {

   bottom: "conv3"

   top: "conv3"

   name: "bn3"

   type: "BatchNorm"

   param {

     lr_mult: 0

   }

   param {

     lr_mult: 0

   }

   param {

     lr_mult: 0

   }

 }

 ##############

 layer {

   name: "relu3"

   type: "ReLU"

   bottom: "conv3"

   top: "conv3"

 }

 layer {

   name: "conv4"

   type: "Convolution"

   bottom: "conv3"

   top: "conv4"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   convolution_param {

     num_output:

     pad:

     kernel_size:

     group:

     weight_filler {

       type: "gaussian"

       std: 0.01

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 ##############

 layer {

   bottom: "conv4"

   top: "conv4"

   name: "bn4"

   type: "BatchNorm"

   param {

     lr_mult: 0

   }

   param {

     lr_mult: 0

   }

   param {

     lr_mult: 0

   }

 }

 ##############

 layer {

   name: "relu4"

   type: "ReLU"

   bottom: "conv4"

   top: "conv4"

 }

 layer {

   name: "conv5"

   type: "Convolution"

   bottom: "conv4"

   top: "conv5"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   convolution_param {

     num_output:

     pad:

     stride:

     kernel_size:

     group:

     weight_filler {

       type: "gaussian"

       std: 0.01

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 ##############

 layer {

   bottom: "conv5"

   top: "conv5"

   name: "bn5"

   type: "BatchNorm"

   param {

     lr_mult: 0

   }

   param {

     lr_mult: 0

   }

   param {

     lr_mult: 0

   }

 }

 ##############

 layer {

   name: "relu5"

   type: "ReLU"

   bottom: "conv5"

   top: "conv5"

 }

 layer {

   name: "pool5"

   type: "Pooling"

   bottom: "conv5"

   top: "pool5"

   pooling_param {

     pool: MAX

     kernel_size:

     stride:

   }

 }

 layer {

   name: "fc6_srx"

   type: "InnerProduct"

   bottom: "pool5"

   top: "fc6"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   inner_product_param {

     num_output:

     weight_filler {

       type: "gaussian"

       std: 0.005

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 layer {

   name: "relu7"

   type: "ReLU"

   bottom: "fc6"

   top: "fc6"

 }

 layer {

   name: "drop7"

   type: "Dropout"

   bottom: "fc6"

   top: "fc6"

   dropout_param {

     dropout_ratio: 0.5

   }

 }

 layer {

   name: "fc7_srx"

   type: "InnerProduct"

   bottom: "fc6"

   top: "fc7"

   param {

     lr_mult:

     decay_mult:

   }

   param {

     lr_mult:

     decay_mult:

   }

   inner_product_param {

     num_output:

     weight_filler {

       type: "gaussian"

       std: 0.01

     }

     bias_filler {

       type: "constant"

       value:

     }

   }

 }

 layer{

   name: "loss"

   type: "SoftmaxWithLoss"

   top: "SoftmaxWithLoss"

   bottom: "fc7"

   bottom: "label"

   include {

     phase: TRAIN

   }

 }

 layer {

   name: "accuracy"

   type: "Accuracy"

   bottom: "fc7"

   bottom: "label"

   top: "accuracy"

   include {

     phase: TEST

   }

 }

caffe中的BatchNorm层的更多相关文章

（原）torch和caffe中的BatchNorm层
转载请注明出处: http://www.cnblogs.com/darkknightzh/p/6015990.html BatchNorm具体网上搜索. caffe中batchNorm层是通过Batc ...
caffe 中 python 数据层
caffe中大多数层用C++写成. 但是对于自己数据的输入要写对应的输入层,比如你要去图像中的一部分,不能用LMDB,或者你的label 需要特殊的标记. 这时候就需要用python 写一个输入层. ...
caffe中全卷积层和全连接层训练参数如何确定
今天来仔细讲一下卷积层和全连接层训练参数个数如何确定的问题.我们以Mnist为例,首先贴出网络配置文件: name: "LeNet" layer { name: "mni ...
caffe中添加local层
下载caffe-local,解压缩; 修改makefile.config:我是将cudnn注释掉,去掉cpu_only的注释; make all make test(其中local_test出错,将文 ...
转载：caffe中的Reshape层
http://blog.csdn.net/terrenceyuu/article/details/76228317 #作用:在不改变数据的情况下,改变输入的维度 layer { name: " ...
caffe中各层的作用:
关于caffe中的solver: caffe中的solver的方法都有: Stochastic Gradient Descent (type: "SGD"), AdaDelta ( ...
深度学习中 batchnorm 层是咋回事？
作者:Double_V_ 来源:CSDN 原文:https://blog.csdn.net/qq_25737169/article/details/79048516 版权声明:本文为博主原创文章,转载 ...
caffe中ConvolutionLayer的前向和反向传播解析及源码阅读
一.前向传播在caffe中,卷积层做卷积的过程被转化成了由卷积核的参数组成的权重矩阵weights(简记为W)和feature map中的元素组成的输入矩阵(简记为Cin)的矩阵乘积W * Cin. ...
caffe中batch norm源码阅读
1. batch norm 输入batch norm层的数据为[N, C, H, W], 该层计算得到均值为C个,方差为C个,输出数据为[N, C, H, W]. <1> 形象点说,均值的 ...

随机推荐

前端小知识（转载http://www.cnblogs.com/Wayou/p/things_you_dont_know_about_frontend.html）
前端已经被玩儿坏了!像console.log()可以向控制台输出图片等炫酷的玩意已经不是什么新闻了,像用||操作符给变量赋默认值也是人尽皆知的旧闻了,今天看到Quora上一个帖子,瞬间又GET了好多前 ...
node06-path
目录:node01-创建服务器 node02-util node03-events node04-buffer node05-fs node06-path node07-http node08-exp ...
Android杂记：genymotion与eclipse报错问题
用eclipse启动genymotion时有时候会报 The connection to adb is down, and a severe error has occured. You must r ...
iOS文件类型判断
最近在做的东西有下载zip,只是服务器发送过来的是二进制,需要根据二进制来判断是什么类型的文件,从而进行保存操作.起初很不理解,到后来发现可以通过二进制的前2位的ascii码来进行判断.如下: // ...
监测程序运行的时间，stopWatch
ArrayList arrInt = new ArrayList(); //用stopwatch来计时运行的时间 Stopwatch watch = new Stopwatch(); watch.S ...
JDK常用工具集——jps
该命令的作用是罗列出目标系统(target system)中所有具有访问权限到的Java进程. 一.命令简介: jps [option] [hostid] 二.参数说明: option ...
[leetcode] 12. Integer to Roman
关于罗马数字: I: 1V: 5X: 10L: 50C: 100D: 500M: 1000字母可以重复,但不超过三次,当需要超过三次时,用与下一位的组合表示:I: 1, II: 2, III: 3, ...
Android 控件的显示隐藏上下左右移动动画
一.利用Android提供的左右移动工具类:AnimationUtils 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 LinearLayout ll_fi ...
abort 用法讨论
同事说: TT***.factary( procedure() begin .... abort; .... end)大家在TTask中不建议用abort因为难以控制,我测试 ...
Listener refused the connection with the following error 错误解决
原文地址 :http://blog.csdn.net/zajin/article/details/17753351 做个备份: 查询数据库当前进程的连接数: select count(*) from ...

caffe中的BatchNorm层

caffe中的BatchNorm层的更多相关文章

随机推荐

热门专题