
YOLOv5 Improvement: Replacing the C3 Module with C2f_RepGhost

Feature reuse is a key technique in the design of lightweight convolutional neural networks. Current methods usually rely on the concatenation operator to cheaply keep a large channel count (and thus network capacity) by reusing feature maps from other layers. Although concatenation itself requires no parameters or FLOPs, its computational cost on hardware devices is not negligible. To address this, the RepGhost paper proposes a new way of realizing feature reuse through structural re-parameterization.

The Ghost Bottleneck module

Modification steps:

Step 1

Create a new file named RepGhost.py in the models folder and add the following code:

import copy

import numpy as np
import torch
import torch.nn as nn
import torch.nn.functional as F


def _make_divisible(v, divisor, min_value=None):
    """
    This function is taken from the original tf repo.
    It ensures that all layers have a channel number that is divisible by 8.
    It can be seen here:
    https://github.com/tensorflow/models/blob/master/research/slim/nets/mobilenet/mobilenet.py
    """
    if min_value is None:
        min_value = divisor
    new_v = max(min_value, int(v + divisor / 2) // divisor * divisor)
    # Make sure that round down does not go down by more than 10%.
    if new_v < 0.9 * v:
        new_v += divisor
    return new_v


def hard_sigmoid(x, inplace: bool = False):
    if inplace:
        return x.add_(3.0).clamp_(0.0, 6.0).div_(6.0)
    else:
        return F.relu6(x + 3.0) / 6.0


class SqueezeExcite(nn.Module):
    def __init__(
        self,
        in_chs,
        se_ratio=0.25,
        reduced_base_chs=None,
        # act_layer=nn.ReLU,
        act_layer=nn.SiLU,
        gate_fn=hard_sigmoid,
        divisor=4,
        **_,
    ):
        super(SqueezeExcite, self).__init__()
        self.gate_fn = gate_fn
        reduced_chs = _make_divisible(
            (reduced_base_chs or in_chs) * se_ratio, divisor,
        )
        self.avg_pool = nn.AdaptiveAvgPool2d(1)
        self.conv_reduce = nn.Conv2d(in_chs, reduced_chs, 1, bias=True)
        self.act1 = act_layer(inplace=True)
        self.conv_expand = nn.Conv2d(reduced_chs, in_chs, 1, bias=True)

    def forward(self, x):
        x_se = self.avg_pool(x)
        x_se = self.conv_reduce(x_se)
        x_se = self.act1(x_se)
        x_se = self.conv_expand(x_se)
        x = x * self.gate_fn(x_se)
        return x


class ConvBnAct(nn.Module):
    def __init__(self, in_chs, out_chs, kernel_size, stride=1, act_layer=nn.SiLU):
        super(ConvBnAct, self).__init__()
        self.conv = nn.Conv2d(
            in_chs, out_chs, kernel_size, stride, kernel_size // 2, bias=False,
        )
        self.bn1 = nn.BatchNorm2d(out_chs)
        self.act1 = act_layer(inplace=True)

    def forward(self, x):
        x = self.conv(x)
        x = self.bn1(x)
        x = self.act1(x)
        return x


class RepGhostModule(nn.Module):
    def __init__(
        self, inp, oup, kernel_size=1, dw_size=3, stride=1, relu=True,
        deploy=False, reparam_bn=True, reparam_identity=False,
    ):
        super(RepGhostModule, self).__init__()
        init_channels = oup
        new_channels = oup
        self.deploy = deploy

        self.primary_conv = nn.Sequential(
            nn.Conv2d(
                inp, init_channels, kernel_size, stride, kernel_size // 2, bias=False,
            ),
            nn.BatchNorm2d(init_channels),
            nn.SiLU(inplace=True) if relu else nn.Sequential(),
        )

        # Re-parameterizable fusion branches (identity + BN); only built at training time.
        fusion_conv = []
        fusion_bn = []
        if not deploy and reparam_bn:
            fusion_conv.append(nn.Identity())
            fusion_bn.append(nn.BatchNorm2d(init_channels))
        if not deploy and reparam_identity:
            fusion_conv.append(nn.Identity())
            fusion_bn.append(nn.Identity())
        self.fusion_conv = nn.Sequential(*fusion_conv)
        self.fusion_bn = nn.Sequential(*fusion_bn)

        # Depthwise "cheap" branch; the fusion branches are folded into it at deploy time.
        self.cheap_operation = nn.Sequential(
            nn.Conv2d(
                init_channels,
                new_channels,
                dw_size,
                1,
                dw_size // 2,
                groups=init_channels,
                bias=deploy,
            ),
            nn.BatchNorm2d(new_channels) if not deploy else nn.Sequential(),
            # nn.ReLU(inplace=True) if relu else nn.Sequential(),
        )
        if deploy:
            self.cheap_operation = self.cheap_operation[0]
        if relu:
            self.relu = nn.SiLU(inplace=False)
        else:
            self.relu = nn.Sequential()

    def forward(self, x):
        x1 = self.primary_conv(x)
        x2 = self.cheap_operation(x1)
        for conv, bn in zip(self.fusion_conv, self.fusion_bn):
            x2 = x2 + bn(conv(x1))
        return self.relu(x2)

    def get_equivalent_kernel_bias(self):
        kernel3x3, bias3x3 = self._fuse_bn_tensor(self.cheap_operation[0], self.cheap_operation[1])
        for conv, bn in zip(self.fusion_conv, self.fusion_bn):
            kernel, bias = self._fuse_bn_tensor(conv, bn, kernel3x3.shape[0], kernel3x3.device)
            kernel3x3 += self._pad_1x1_to_3x3_tensor(kernel)
            bias3x3 += bias
        return kernel3x3, bias3x3

    @staticmethod
    def _pad_1x1_to_3x3_tensor(kernel1x1):
        if kernel1x1 is None:
            return 0
        else:
            return torch.nn.functional.pad(kernel1x1, [1, 1, 1, 1])

    @staticmethod
    def _fuse_bn_tensor(conv, bn, in_channels=None, device=None):
        in_channels = in_channels if in_channels else bn.running_mean.shape[0]
        device = device if device else bn.weight.device
        if isinstance(conv, nn.Conv2d):
            kernel = conv.weight
            assert conv.bias is None
        else:
            assert isinstance(conv, nn.Identity)
            kernel_value = np.zeros((in_channels, 1, 1, 1), dtype=np.float32)
            for i in range(in_channels):
                kernel_value[i, 0, 0, 0] = 1
            kernel = torch.from_numpy(kernel_value).to(device)

        if isinstance(bn, nn.BatchNorm2d):
            running_mean = bn.running_mean
            running_var = bn.running_var
            gamma = bn.weight
            beta = bn.bias
            eps = bn.eps
            std = (running_var + eps).sqrt()
            t = (gamma / std).reshape(-1, 1, 1, 1)
            return kernel * t, beta - running_mean * gamma / std
        assert isinstance(bn, nn.Identity)
        return kernel, torch.zeros(in_channels).to(kernel.device)

    def switch_to_deploy(self):
        # Fold the training-time fusion branches into a single depthwise conv.
        if len(self.fusion_conv) == 0 and len(self.fusion_bn) == 0:
            return
        kernel, bias = self.get_equivalent_kernel_bias()
        self.cheap_operation = nn.Conv2d(
            in_channels=self.cheap_operation[0].in_channels,
            out_channels=self.cheap_operation[0].out_channels,
            kernel_size=self.cheap_operation[0].kernel_size,
            padding=self.cheap_operation[0].padding,
            dilation=self.cheap_operation[0].dilation,
            groups=self.cheap_operation[0].groups,
            bias=True,
        )
        self.cheap_operation.weight.data = kernel
        self.cheap_operation.bias.data = bias
        self.__delattr__('fusion_conv')
        self.__delattr__('fusion_bn')
        self.fusion_conv = []
        self.fusion_bn = []
        self.deploy = True


class RepGhostBottleneck(nn.Module):
    """RepGhost bottleneck w/ optional SE"""

    def __init__(
        self,
        in_chs,
        mid_chs,
        out_chs,
        dw_kernel_size=3,
        stride=1,
        se_ratio=0.0,
        shortcut=True,
        reparam=True,
        reparam_bn=True,
        reparam_identity=False,
        deploy=False,
    ):
        super(RepGhostBottleneck, self).__init__()
        has_se = se_ratio is not None and se_ratio > 0.0
        self.stride = stride
        self.enable_shortcut = shortcut
        self.in_chs = in_chs
        self.out_chs = out_chs

        # Point-wise expansion
        self.ghost1 = RepGhostModule(
            in_chs,
            mid_chs,
            relu=True,
            reparam_bn=reparam and reparam_bn,
            reparam_identity=reparam and reparam_identity,
            deploy=deploy,
        )

        # Depth-wise convolution
        if self.stride > 1:
            self.conv_dw = nn.Conv2d(
                mid_chs,
                mid_chs,
                dw_kernel_size,
                stride=stride,
                padding=(dw_kernel_size - 1) // 2,
                groups=mid_chs,
                bias=False,
            )
            self.bn_dw = nn.BatchNorm2d(mid_chs)

        # Squeeze-and-excitation
        if has_se:
            self.se = SqueezeExcite(mid_chs, se_ratio=se_ratio)
        else:
            self.se = None

        # Point-wise linear projection
        self.ghost2 = RepGhostModule(
            mid_chs,
            out_chs,
            relu=False,
            reparam_bn=reparam and reparam_bn,
            reparam_identity=reparam and reparam_identity,
            deploy=deploy,
        )

        # shortcut
        if in_chs == out_chs and self.stride == 1:
            self.shortcut = nn.Sequential()
        else:
            self.shortcut = nn.Sequential(
                nn.Conv2d(
                    in_chs,
                    in_chs,
                    dw_kernel_size,
                    stride=stride,
                    padding=(dw_kernel_size - 1) // 2,
                    groups=in_chs,
                    bias=False,
                ),
                nn.BatchNorm2d(in_chs),
                nn.Conv2d(
                    in_chs, out_chs, 1, stride=1,
                    padding=0, bias=False,
                ),
                nn.BatchNorm2d(out_chs),
            )

    def forward(self, x):
        residual = x
        x1 = self.ghost1(x)
        if self.stride > 1:
            x = self.conv_dw(x1)
            x = self.bn_dw(x)
        else:
            x = x1
        if self.se is not None:
            x = self.se(x)
        # 2nd repghost module (point-wise linear projection)
        x = self.ghost2(x)
        if not self.enable_shortcut and self.in_chs == self.out_chs and self.stride == 1:
            return x
        return x + self.shortcut(residual)


def repghost_model_convert(model: torch.nn.Module, save_path=None, do_copy=True):
    """
    taken from https://github.com/DingXiaoH/RepVGG/blob/main/repvgg.py
    """
    if do_copy:
        model = copy.deepcopy(model)
    for module in model.modules():
        if hasattr(module, 'switch_to_deploy'):
            module.switch_to_deploy()
    if save_path is not None:
        torch.save(model, save_path)  # saves the whole model; use model.state_dict() to save weights only
    return model
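Before wiring the module into YOLOv5, it can be worth checking that the re-parameterization is numerically sound. The following is a minimal sanity check, not part of the original post, assuming RepGhost.py was saved under models/ as above and the script is run from the YOLOv5 repo root:

import torch
from models.RepGhost import RepGhostModule, repghost_model_convert

m = RepGhostModule(32, 32, relu=True).eval()   # eval() so BN uses its running statistics
x = torch.randn(1, 32, 64, 64)
y_train = m(x)                                 # training-time structure: dw conv + extra BN branch

m_deploy = repghost_model_convert(m)           # folds the BN branch into the depthwise conv
y_deploy = m_deploy(x)

print(torch.allclose(y_train, y_deploy, atol=1e-5))  # expected: True

If the two outputs match, switch_to_deploy can later be applied to the whole detector the same way (via repghost_model_convert) to get the cheaper inference-time structure.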

Step 2

Add the following code to common.py:

# Add this import near the top of common.py so the block can use the
# RepGhost bottleneck created in Step 1.
from models.RepGhost import RepGhostBottleneck


class C2frepghost(nn.Module):
    # C2f-style CSP bottleneck with 2 convolutions and RepGhost bottlenecks
    def __init__(self, c1, c2, n=1, shortcut=False, g=1, e=0.5):  # ch_in, ch_out, number, shortcut, groups, expansion
        super().__init__()
        self.c = int(c2 * e)  # hidden channels
        self.cv1 = Conv(c1, 2 * self.c, 1, 1)
        self.cv2 = Conv((2 + n) * self.c, c2, 1)
        self.m = nn.ModuleList(
            RepGhostBottleneck(self.c, self.c, self.c, dw_kernel_size=3) for _ in range(n)
        )

    def forward(self, x):
        y = list(self.cv1(x).split((self.c, self.c), 1))
        y.extend(m(y[-1]) for m in self.m)
        return self.cv2(torch.cat(y, 1))
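As a quick usage check (again not from the original post, and assuming Step 2 has been applied and the script is run from the YOLOv5 repo root), the new block can be compared directly against the C3 block it replaces, both for output shape and for parameter count:

import torch
from models.common import C3, C2frepghost

c3 = C3(128, 128, n=3)
c2f = C2frepghost(128, 128, n=3)

count = lambda m: sum(p.numel() for p in m.parameters())
print('C3 params:         ', count(c3))
print('C2frepghost params:', count(c2f))

x = torch.randn(1, 128, 40, 40)
print(c2f(x).shape)  # torch.Size([1, 128, 40, 40]) -- same spatial size, c2 output channels

Note that in the C2f-style block, cv2 sees (2 + n) * c input channels because every bottleneck output is kept and concatenated, whereas C3 concatenates only two branches; this structural difference is what changes the parameter count relative to C3 at the same width.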

Step 3

Add the following code to the yolo.py file:
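The original post does not reproduce the snippet for this step. In a standard YOLOv5 yolo.py, registering a new block means adding it to the module tuples inside parse_model() so that channel scaling and the repeat count n are handled the same way as for C3. A sketch is shown below; the exact contents of the tuples depend on your YOLOv5 version, and the only changes are the two C2frepghost entries:

# inside parse_model() in models/yolo.py
if m in (Conv, GhostConv, Bottleneck, GhostBottleneck, SPP, SPPF, DWConv,
         MixConv2d, Focus, CrossConv, BottleneckCSP, C3, C3TR, C3SPP,
         C3Ghost, nn.ConvTranspose2d, DWConvTranspose2d, C3x,
         C2frepghost):                              # <-- register the new block here
    c1, c2 = ch[f], args[0]
    if c2 != no:  # if not output
        c2 = make_divisible(c2 * gw, 8)

    args = [c1, c2, *args[1:]]
    if m in [BottleneckCSP, C3, C3TR, C3Ghost, C3x, C2frepghost]:  # <-- and here
        args.insert(2, n)  # insert number of repeats
        n = 1

Because yolo.py already does from models.common import *, no extra import is needed once C2frepghost lives in common.py.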

Step 4

Create the yaml file:

# YOLOv5
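The configuration is truncated in the original post after this first comment line. One possible yolov5s-based yaml, with the backbone C3 blocks swapped for C2frepghost and the head left untouched (nc, anchors and the depth/width multiples taken from the stock yolov5s.yaml), might look like:

# Parameters
nc: 80  # number of classes
depth_multiple: 0.33  # model depth multiple
width_multiple: 0.50  # layer channel multiple
anchors:
  - [10,13, 16,30, 33,23]  # P3/8
  - [30,61, 62,45, 59,119]  # P4/16
  - [116,90, 156,198, 373,326]  # P5/32

# YOLOv5 v6.0 backbone, with C3 replaced by C2frepghost
backbone:
  # [from, number, module, args]
  [[-1, 1, Conv, [64, 6, 2, 2]],  # 0-P1/2
   [-1, 1, Conv, [128, 3, 2]],  # 1-P2/4
   [-1, 3, C2frepghost, [128]],
   [-1, 1, Conv, [256, 3, 2]],  # 3-P3/8
   [-1, 6, C2frepghost, [256]],
   [-1, 1, Conv, [512, 3, 2]],  # 5-P4/16
   [-1, 9, C2frepghost, [512]],
   [-1, 1, Conv, [1024, 3, 2]],  # 7-P5/32
   [-1, 3, C2frepghost, [1024]],
   [-1, 1, SPPF, [1024, 5]],  # 9
  ]

# YOLOv5 v6.0 head (unchanged)
head:
  [[-1, 1, Conv, [512, 1, 1]],
   [-1, 1, nn.Upsample, [None, 2, 'nearest']],
   [[-1, 6], 1, Concat, [1]],  # cat backbone P4
   [-1, 3, C3, [512, False]],  # 13

   [-1, 1, Conv, [256, 1, 1]],
   [-1, 1, nn.Upsample, [None, 2, 'nearest']],
   [[-1, 4], 1, Concat, [1]],  # cat backbone P3
   [-1, 3, C3, [256, False]],  # 17 (P3/8-small)

   [-1, 1, Conv, [256, 3, 2]],
   [[-1, 14], 1, Concat, [1]],  # cat head P4
   [-1, 3, C3, [512, False]],  # 20 (P4/16-medium)

   [-1, 1, Conv, [512, 3, 2]],
   [[-1, 10], 1, Concat, [1]],  # cat head P5
   [-1, 3, C3, [1024, False]],  # 23 (P5/32-large)

   [[17, 20, 23], 1, Detect, [nc, anchors]],  # Detect(P3, P4, P5)
  ]

The head C3 blocks can be replaced the same way if a fully RepGhost-based model is wanted; training then proceeds with the usual train.py --cfg pointing at this yaml.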