YOLO v2 cfg文件参数

[net]
batch=64                           每次迭代要进行训练的图片数量
subdivisions=8                     如果内存不够大，将batch分割为subdivisions个子batch，每个子batch的大小为batch/subdivisions。
                                   在darknet代码中，会将batch/subdivisions命名为batch。
height=416                         input图像的高
width=416                          Input图像的宽
channels=3                         Input图像的通道数
momentum=0.9                       动量
decay=0.0005                       权重衰减正则项，防止过拟合
angle=0                            图片角度变化，单位为度，假如angle=5，就是生成新图片的时候随机旋转-5~5度 
saturation = 1.5                   饱和度与曝光变化大小，tiny-yolo-voc.cfg中1到1.5倍，以及1/1.5~1倍 
exposure = 1.5                     同上
hue=.1                             色调变化范围，tiny-yolo-voc.cfg中-0.1~0.1

learning_rate=0.0001               初始学习率

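burn_in=1000                       学习率预热（warm-up）：当迭代次数batch_num小于burn_in时，学习率为 learning_rate * (batch_num/burn_in)^power（power默认为4），从很小的值逐步升到learning_rate；超过burn_in后才按policy调整学习率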
max_batches = 45000                训练达到max_batches后停止学习
policy=steps                       调整学习率的policy，有如下policy：CONSTANT, STEP, EXP, POLY, STEPS, SIG, RANDOM
steps=100,25000,35000              根据batch_num调整学习率
scales=10,.1,.1                    学习率变化的比例，累计相乘

[convolutional]
batch_normalize=1                  是否做BN
filters=32                         输出多少个特征图
size=3                             卷积核的尺寸
stride=1                           做卷积运算的步长
pad=1                              如果pad为0,padding由 padding参数指定。如果pad为1，padding大小为size/2
activation=leaky                   激活函数：
                                   logistic，loggy，relu，elu，relie，plse，hardtan，lhtan，linear，ramp，leaky，tanh，stair

[maxpool]
size=2                             池化层尺寸
stride=2                           池化步进

[convolutional]
batch_normalize=1
filters=64
size=3
stride=1
pad=1
activation=leaky

[maxpool]
size=2
stride=2

......
......


#######

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[route]                            the route layer is to bring finer grained features in from earlier in the network
layers=-9

[reorg]                            the reorg layer is to make these features match the feature map size at the later layer. 
                                   The end feature map is 13x13, the feature map from earlier is 26x26x512. 
                                   The reorg layer maps the 26x26x512 feature map onto a 13x13x2048 feature map 
                                   so that it can be concatenated with the feature maps at 13x13 resolution.
stride=2

[route]
layers=-1,-3

[convolutional]
batch_normalize=1
size=3
stride=1
pad=1
filters=1024
activation=leaky

[convolutional]
size=1
stride=1
pad=1
filters=125                        region前最后一个卷积层的filters数是特定的，计算公式为filters=num*(classes+5)，本例为5*(20+5)=125
                                   5的意义是4个坐标加1个置信度，即论文中的tx,ty,tw,th,to
activation=linear

[region]
anchors = 1.08,1.19,  3.42,4.41,  6.63,11.38,  9.42,5.11,  16.62,10.52          预选框，可以手工挑选，也可以通过k-means从训练样本中学出预测框的初始宽高；每一对数值中第一个是w，第二个是h，总数量是num*2。YOLOv2作者说anchors是使用k-means获得的，其实就是统计出哪种形状的框比较多，这样可以加快收敛速度。如果不设置anchors，默认值是0.5。另外，anchors读入后在代码中的参数名是biases
bias_match=1                       如果为1，计算best iou时，预测宽高强制与anchors一致
classes=20                         类别数量
coords=4                           BoundingBox的tx,ty,tw,th，tx与ty是相对于所在grid左上角的偏移，以grid大小为单位的比例，tw与th是宽度与高度取对数
num=5                              每个grid预测的BoundingBox个数
softmax=1                          为1时，使用softmax做激活函数
jitter=.2                          利用数据抖动产生更多数据，YOLOv2中使用的是crop，flip，以及net层的angle，flip是随机的，crop就是jitter的参数，tiny-yolo-voc.cfg中jitter=.2，就是在0~0.2中进行crop
rescore=1                          决定使用哪种方式计算IOU的误差，为1时，使用当前best iou计算，为0时，使用1计算；
object_scale=5                     栅格中有物体时，bbox的confidence loss对总loss计算贡献的权重；
noobject_scale=1                   栅格中没有物体时，bbox的confidence loss对总loss计算贡献的权重
class_scale=1                      类别loss对总loss计算贡献的权重                      
coord_scale=1                      bbox坐标预测loss对总loss计算贡献的权重
                                   YOLOv1论文中cost function的权重，哪一个更大，每一次更新权重的时候，对应方面的权重更新相对比重更大 
absolute=1
thresh = .6                        决定是否需要计算IOU误差的参数，大于thresh，IOU误差不会加在cost function中
random=0                           random为1时会启用Multi-Scale Training，随机使用不同尺寸的图片进行训练。如果为1每次迭代图片大小随机从320到608，步长为32，如果为0，每次训练大小与输入大小一致

参考：https://blog.csdn.net/fate_fjh/article/details/70598510

https://blog.csdn.net/hrsstudy/article/details/65447947

https://github.com/AlexeyAB/darknet/issues/279

HSV（saturation、exposure、hue）相关说明：https://github.com/AlexeyAB/darknet/issues/740

YOLO v2 cfg文件参数

猜你喜欢