将YOLOv5的backbone网络更换为ShuffleNetV2,以达到模型轻量化的目的
1. 试运行YOLOv5
2. VOC数据集处理
3. 更改轻量级网络
3.1 在common.py末尾加入以下代码
# ---------------------------- ShuffleBlock start -------------------------------
# Channel shuffle: lets information flow between channel groups
def channel_shuffle(x: torch.Tensor, groups: int) -> torch.Tensor:
    """Interleave the channels of ``x`` across ``groups`` groups.

    The channel axis is viewed as ``(groups, channels_per_group)``, the two
    axes are swapped, and the result is flattened back, so output channel
    ``j * groups + g`` is input channel ``g * channels_per_group + j``.

    Args:
        x: 4-D tensor unpacked as (batch, channels, height, width).
        groups: Number of groups; must be positive and divide the channel count.

    Returns:
        A tensor with the same shape as ``x`` and its channels permuted.

    Raises:
        ValueError: If ``groups`` is not positive or does not divide the
            channel count.
    """
    batchsize, num_channels, height, width = x.shape
    if groups <= 0 or num_channels % groups != 0:
        raise ValueError(
            'channel count %d is not divisible by groups=%d' % (num_channels, groups)
        )
    channels_per_group = num_channels // groups

    # reshape: split the channel axis into (groups, channels_per_group)
    x = x.view(batchsize, groups, channels_per_group, height, width)
    # swap the two axes; contiguous() is required before the next view()
    x = torch.transpose(x, 1, 2).contiguous()
    # flatten back to (batch, channels, height, width)
    return x.view(batchsize, -1, height, width)
class conv_bn_relu_maxpool(nn.Module):
    """Stem block: 3x3 stride-2 conv -> BatchNorm -> ReLU -> 3x3 stride-2 max-pool.

    The conv and the pool each halve the spatial size, so the output is 1/4
    of the input resolution.

    Args:
        c1: Number of input channels.
        c2: Number of output channels.
    """

    def __init__(self, c1, c2):  # ch_in, ch_out
        super().__init__()
        self.conv = nn.Sequential(
            # bias is omitted because the following BatchNorm has its own shift
            nn.Conv2d(c1, c2, kernel_size=3, stride=2, padding=1, bias=False),
            nn.BatchNorm2d(c2),
            nn.ReLU(inplace=True),
        )
        self.maxpool = nn.MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)

    def forward(self, x):
        """Apply conv-BN-ReLU and then max-pooling to ``x``."""
        return self.maxpool(self.conv(x))
class Shuffle_Block(nn.Module):
    """ShuffleNetV2 unit with two branches followed by a channel shuffle.

    With ``stride == 1`` the input is split in half along the channel axis:
    one half passes through unchanged, the other goes through ``branch2``.
    With ``stride > 1`` the full input goes through both ``branch1`` and
    ``branch2``. Either way the two results are concatenated on the channel
    axis and shuffled with two groups.

    Args:
        inp: Number of input channels.
        oup: Number of output channels; each branch produces ``oup // 2``.
        stride: Stride of the depthwise convolutions, between 1 and 3.

    Raises:
        ValueError: If ``stride`` is outside ``1..3``.
        AssertionError: If ``stride == 1`` and ``inp != 2 * (oup // 2)``.
    """

    def __init__(self, inp, oup, stride):
        super().__init__()

        if not (1 <= stride <= 3):
            raise ValueError('illegal stride value')
        self.stride = stride

        branch_features = oup // 2
        # A stride-1 unit splits its input in half, so it cannot change the width.
        assert (self.stride != 1) or (inp == branch_features << 1), \
            'stride-1 Shuffle_Block requires inp == 2 * (oup // 2)'

        if self.stride > 1:
            # Downsampling shortcut: depthwise 3x3 followed by pointwise 1x1.
            self.branch1 = nn.Sequential(
                self.depthwise_conv(inp, inp, kernel_size=3, stride=self.stride, padding=1),
                nn.BatchNorm2d(inp),
                nn.Conv2d(inp, branch_features, kernel_size=1, stride=1, padding=0, bias=False),
                nn.BatchNorm2d(branch_features),
                nn.ReLU(inplace=True),
            )

        # Main branch: pointwise 1x1 -> depthwise 3x3 -> pointwise 1x1.
        self.branch2 = nn.Sequential(
            nn.Conv2d(inp if (self.stride > 1) else branch_features,
                      branch_features, kernel_size=1, stride=1, padding=0, bias=False),
            nn.BatchNorm2d(branch_features),
            nn.ReLU(inplace=True),
            self.depthwise_conv(branch_features, branch_features, kernel_size=3, stride=self.stride, padding=1),
            nn.BatchNorm2d(branch_features),
            nn.Conv2d(branch_features, branch_features, kernel_size=1, stride=1, padding=0, bias=False),
            nn.BatchNorm2d(branch_features),
            nn.ReLU(inplace=True),
        )

    @staticmethod
    def depthwise_conv(i, o, kernel_size, stride=1, padding=0, bias=False):
        """Return a Conv2d with ``groups=i``, i.e. one filter group per input channel."""
        return nn.Conv2d(i, o, kernel_size, stride, padding, bias=bias, groups=i)

    def forward(self, x):
        """Run the unit on ``x`` and return the channel-shuffled result."""
        if self.stride == 1:
            x1, x2 = x.chunk(2, dim=1)  # split in half along dimension 1 (channels)
            out = torch.cat((x1, self.branch2(x2)), dim=1)
        else:
            out = torch.cat((self.branch1(x), self.branch2(x)), dim=1)

        out = channel_shuffle(out, 2)
        return out
# ---------------------------- ShuffleBlock end --------------------------------
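3.2 在yolo.py的parse_model函数里注册新的模块
# 新加模块conv_bn_relu_maxpool, Shuffle_Block:把这两个类名加入parse_model中处理Conv、C3等模块的 `if m in [...]` 列表,这样输入/输出通道数(c1, c2)会像其他卷积模块一样被自动推断并按width_multiple缩放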
3.3 在models目录下新建yolov5.0s_shufflenetv2.yaml
# parameters
nc: 20  # number of classes
depth_multiple: 0.33  # model depth multiple
width_multiple: 0.50  # layer channel multiple

# anchors
anchors:
  - [10,13, 16,30, 33,23]  # P3/8
  - [30,61, 62,45, 59,119]  # P4/16
  - [116,90, 156,198, 373,326]  # P5/32

# YOLOv5 backbone
backbone:
  # [from, number, module, args]
  # Shuffle_Block: [out, stride]
  # NOTE(review): layer 5 is already labelled P5/32, so the stride-2 Conv at
  # layer 7 presumably produces /64 rather than the /32 written next to it -
  # confirm the intended output strides before relying on the P-level labels.
  [[ -1, 1, conv_bn_relu_maxpool, [ 32 ] ],  # 0-P2/4
   [ -1, 1, Shuffle_Block, [ 128, 2 ] ],  # 1-P3/8
   [ -1, 3, Shuffle_Block, [ 128, 1 ] ],  # 2
   [ -1, 1, Shuffle_Block, [ 256, 2 ] ],  # 3-P4/16
   [ -1, 7, Shuffle_Block, [ 256, 1 ] ],  # 4
   [ -1, 1, Shuffle_Block, [ 512, 2 ] ],  # 5-P5/32
   [ -1, 3, Shuffle_Block, [ 512, 1 ] ],  # 6
   [ -1, 1, Conv, [ 1024, 3, 2 ] ],  # 7-P5/32
   [ -1, 1, SPP, [ 1024, [ 5, 9, 13 ] ] ],  # 8
   [ -1, 3, C3, [ 1024, False ] ],  # 9
  ]

# YOLOv5 v5.0 head
head:
  [[-1, 1, Conv, [512, 1, 1]],  # 10
   [-1, 1, nn.Upsample, [None, 2, 'nearest']],  # 11
   [[-1, 6], 1, Concat, [1]],  # 12 cat backbone P4
   [-1, 3, C3, [512, False]],  # 13

   [-1, 1, Conv, [256, 1, 1]],  # 14
   [-1, 1, nn.Upsample, [None, 2, 'nearest']],  # 15
   [[-1, 4], 1, Concat, [1]],  # 16 cat backbone P3
   [-1, 3, C3, [256, False]],  # 17 (P3/8-small)

   [-1, 1, Conv, [256, 3, 2]],  # 18
   [[-1, 14], 1, Concat, [1]],  # 19 cat head P4
   [-1, 3, C3, [512, False]],  # 20 (P4/16-medium)

   [-1, 1, Conv, [512, 3, 2]],  # 21
   [[-1, 10], 1, Concat, [1]],  # 22 cat head P5
   [-1, 3, C3, [1024, False]],  # 23 (P5/32-large)

   # Detect reads the three outputs labelled small/medium/large (17, 20, 23),
   # in the same small-to-large order as the anchors list.
   [[17, 20, 23], 1, Detect, [nc, anchors]],  # 24 Detect(P3, P4, P5)
  ]

3.4 更改train.py设置训练参数
4. 迁移学习训练改后网络
# Freeze
# Replaces the default `freeze = []` (nothing frozen): any parameter whose name
# contains 'model.10.' ... 'model.23.' is frozen, i.e. the layers numbered
# 10-23 in the model yaml; every other parameter stays trainable.
freeze = ['model.%s.' % x for x in range(10, 24)]  # parameter names to freeze (full or partial)
for k, v in model.named_parameters():
    v.requires_grad = True  # train all layers
    if any(x in k for x in freeze):
        print('freezing %s' % k)
        v.requires_grad = False
Class Images Labels P R mAP@.5 mAP@.5:.95: 100%|██████████| 155/155 [00:56<00:00, 2.73it/s]
all 4952 12032 0.683 0.607 0.648 0.394
aeroplane 4952 285 0.712 0.663 0.715 0.438
bicycle 4952 337 0.853 0.706 0.779 0.49
bird 4952 459 0.603 0.547 0.564 0.315
boat 4952 263 0.599 0.556 0.582 0.275
bottle 4952 469 0.524 0.301 0.322 0.156
bus 4952 213 0.783 0.657 0.736 0.578
car 4952 1201 0.777 0.749 0.805 0.549
cat 4952 358 0.734 0.703 0.754 0.513
chair 4952 756 0.5 0.374 0.375 0.187
cow 4952 244 0.675 0.52 0.588 0.335
diningtable 4952 206 0.703 0.544 0.624 0.404
dog 4952 489 0.672 0.578 0.646 0.398
horse 4952 348 0.742 0.747 0.776 0.47
motorbike 4952 325 0.821 0.734 0.804 0.49
person 4952 4528 0.774 0.687 0.764 0.409
pottedplant 4952 480 0.605 0.388 0.418 0.173
sheep 4952 242 0.515 0.677 0.603 0.37
sofa 4952 239 0.653 0.569 0.601 0.385
train 4952 282 0.753 0.766 0.821 0.517
tvmonitor 4952 308 0.672 0.672 0.69 0.42
100 epochs completed in 7.559 hours.
Optimizer stripped from runs\train\exp23\weights\last.pt, 12.3MB
Optimizer stripped from runs\train\exp23\weights\best.pt, 12.3MB