12.12 深度学习-卷积的注意力机制-通道注意力SENet

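# Attention tells the model to give certain things extra weight during
# training: additional learnable weights decide where the attention goes.
#
# Unimportant features are suppressed by lowering their weights. For example,
# colour matters most in some tasks while shape matters most in others.
#
# Channel attention is normally applied to feature maps that already have a
# fairly large number of channels.
#
# SENet
#
# The incoming feature map is squeezed to 1x1 per channel (global average
# pooling, channel count unchanged), a weight is produced for every channel,
# and each channel of the original feature map is multiplied by its weight.
# That distributes attention across channels while the output keeps exactly
# the same C, H, W shape as the input.
#
# Because C, H and W are unchanged, the attention block is plug-and-play.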

import torch

import os

import torch.nn as nn

from torchvision.models import resnet18,ResNet18_Weights

from torchvision.models.resnet import _resnet,BasicBlock

# Directory that contains this script.
path = os.path.dirname(__file__)

# Target file for the ONNX export in demo2, expressed relative to the current
# working directory.
onnxpath = os.path.relpath(os.path.join(path, "assets/resnet_SE-Identity.onnx"))

class SENet1(nn.Module):
    """Squeeze-and-Excitation (SE) channel-attention block.

    The input is average-pooled to one value per channel, passed through a
    two-layer bottleneck MLP (Linear+ReLU, Linear+Sigmoid) to obtain one
    weight in (0, 1) per channel, and the input is then multiplied by those
    weights. The output has the same shape as the input.

    Args:
        inchannel: Number of channels of the input feature map.
        r: Reduction factor of the bottleneck; the hidden layer has
            ``inchannel // r`` units, clamped to at least 1.
    """

    def __init__(self, inchannel, r=16):
        super().__init__()

        self.inchannel = inchannel

        # Squeeze: global average pooling collapses every channel to 1x1.
        # Average pooling is used rather than max pooling because the goal is
        # a summary of the whole channel, not its single strongest response.
        self.pool1 = nn.AdaptiveAvgPool2d(1)

        # Excitation: two fully connected layers instead of one. The first
        # shrinks the channel count by the reduction factor to keep the
        # parameter count down, the second expands back to `inchannel`.
        # Without the clamp, inchannel < r would give a zero-width bottleneck
        # and the gate would degenerate to sigmoid(bias), ignoring the input.
        hidden = max(1, self.inchannel // r)

        # Author's rule of thumb: ReLU discards information, so prefer a
        # reduction factor that leaves the bottleneck reasonably wide
        # (the original note suggests at least 32 units).
        self.fc1 = nn.Sequential(nn.Linear(self.inchannel, hidden), nn.ReLU())

        # Sigmoid maps each channel's score to a weight between 0 and 1.
        self.fc2 = nn.Sequential(nn.Linear(hidden, self.inchannel), nn.Sigmoid())

    def forward(self, x):
        """Return `x` with every channel scaled by its learned attention weight."""
        # (N, C, H, W) -> (N, C, 1, 1) -> (N, C)
        weights = self.pool1(x)
        weights = weights.flatten(1)

        weights = self.fc1(weights)
        weights = self.fc2(weights)

        # Back to (N, C, 1, 1) so the weights broadcast over H and W.
        weights = weights.unsqueeze(2).unsqueeze(3)

        return x * weights

def demo1():
    """Run one random feature map through an SE block and print the output shape.

    The printed shape equals the input shape (1, 128, 224, 224), showing that
    the block leaves C, H and W unchanged.
    """
    torch.manual_seed(666)

    img1 = torch.rand(1, 128, 224, 224)

    senet1 = SENet1(img1.shape[1], 2)

    # Call the module itself rather than `.forward()` so that nn.Module's
    # __call__ machinery (hooks etc.) is not bypassed.
    res = senet1(img1)

    print(res.shape)

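# The SE module can be added to classic CNN models. In networks that have
# residual blocks, SE is typically attached to the residual branch: the output
# of the block's convolutions is the input of the SE module.
#
# Before the convolved data is added to the original (identity) data, multiply
# the convolved data by the channel weights that SE derives from it, and only
# then add the identity.
#
# Doing this requires reading the model's source code.
#
# SE does not have to go after the residual convolutions; there are several
# ways to insert it.
#
# The first step is to locate the network's residual block.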

def demo2():
    """Build a ResNet-18 whose residual blocks contain SE and export it to ONNX.

    A `BasicBlock` subclass rewrites the residual block's forward pass to
    include an `SENet1` module (the "SE-Identity" placement). The resulting
    model is exported to the module-level `onnxpath`.
    """

    # Subclass torchvision's BasicBlock and override parts of the ResNet-18
    # residual block.
    class BasicBlock_SE(BasicBlock):
        """BasicBlock with SE applied on the identity (shortcut) branch."""

        def __init__(
            self,
            inplanes,
            planes,
            stride=1,
            downsample=None,
            groups=1,
            base_width=64,
            dilation=1,
            norm_layer=None,
        ):
            super().__init__(inplanes, planes, stride, downsample, groups, base_width, dilation, norm_layer)

            # SE-Identity: the input is used twice. One copy goes through the
            # convolutions, the other through SE, and the two are added.
            self.se = SENet1(inplanes)

        def forward(self, x):
            # Shortcut branch: channel attention on the raw input.
            identity = self.se(x)

            out = self.conv1(x)
            out = self.bn1(out)
            out = self.relu(out)

            out = self.conv2(out)
            out = self.bn2(out)

            if self.downsample is not None:
                # The SE-weighted shortcut (not the raw input) is downsampled.
                identity = self.downsample(identity)

            out += identity
            out = self.relu(out)

            return out

        # ------------------------------------------------------------------
        # Alternative SE placements, kept for reference.
        # ------------------------------------------------------------------

        # SE-POST: apply SE after the residual block has fully finished.
        # In __init__: self.se = SENet1(planes)
        # def forward(self, x):
        #     identity = x
        #     out = self.conv1(x)
        #     out = self.bn1(out)
        #     out = self.relu(out)
        #     out = self.conv2(out)
        #     out = self.bn2(out)
        #     if self.downsample is not None:
        #         identity = self.downsample(x)
        #     out += identity
        #     out = self.relu(out)
        #     out = self.se(out)
        #     return out

        # SE-PRE: apply SE before the convolutions of the residual block.
        # In __init__: self.se = SENet1(inplanes)
        # def forward(self, x):
        #     identity = x
        #     out = self.se(x)
        #     out = self.conv1(out)
        #     out = self.bn1(out)
        #     out = self.relu(out)
        #     out = self.conv2(out)
        #     out = self.bn2(out)
        #     if self.downsample is not None:
        #         identity = self.downsample(x)
        #     out += identity
        #     out = self.relu(out)
        #     return out

        # Standard SE: apply SE after the convolutions, then add the identity.
        # In __init__: self.se = SENet1(planes)
        # def forward(self, x):
        #     identity = x
        #     out = self.conv1(x)
        #     out = self.bn1(out)
        #     out = self.relu(out)
        #     out = self.conv2(out)
        #     out = self.bn2(out)
        #     if self.downsample is not None:
        #         identity = self.downsample(x)
        #     out = self.se(out)
        #     out += identity
        #     out = self.relu(out)
        #     return out

    def resnet18_SE(*, weights=None, progress: bool = True, **kwargs):
        """ResNet-18 constructor that uses `BasicBlock_SE` as the block type."""
        weights = ResNet18_Weights.verify(weights)

        return _resnet(BasicBlock_SE, [2, 2, 2, 2], weights, progress, **kwargs)

    model1 = resnet18_SE()

    # Dummy input used to trace the model during export.
    x = torch.randn(1, 3, 224, 224)

    # Make sure the output directory exists before the exporter opens the file.
    out_dir = os.path.dirname(onnxpath)
    if out_dir:
        os.makedirs(out_dir, exist_ok=True)

    # Export to ONNX. The example input must be passed as `args`; the original
    # call omitted it, putting the path in the `args` slot.
    torch.onnx.export(
        model1,
        (x,),
        onnxpath,
        verbose=True,  # print the conversion process
        input_names=["input"],
        output_names=["output"],
    )

    print("onnx导出成功")

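# SE contributes little in the early layers of a model; adding it only to the
# later layers gives a clear benefit and costs fewer parameters than adding it
# everywhere.
#
# Modifying a model is not just a matter of adding a new sub-network: also
# check that the forward pass still works afterwards.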

def demo3():  # add SE only to a late layer of ResNet-18, not to the early layers
    """Attach an SE block to layer3 of ResNet-18 and export that layer to ONNX.

    A `ResNet` subclass gains a helper that wraps `layer3[1].conv2` together
    with an `SENet1` in an `nn.Sequential`. The modified `layer3` is then
    exported on its own to ``layer.onnx`` in the current working directory.
    """
    # Imported locally because the file's top-level imports do not provide
    # these names; both come from torchvision, which the file already uses.
    from torchvision.models._utils import _ovewrite_named_param
    from torchvision.models.resnet import ResNet

    class ResNet_SE_laye(ResNet):
        """ResNet with a helper that inserts SE into the second block of layer3."""

        def __init__(
            self,
            block,
            layers,
            num_classes=1000,
            zero_init_residual=False,
            groups=1,
            width_per_group=64,
            replace_stride_with_dilation=None,
            norm_layer=None,
        ):
            super().__init__(
                block,
                layers,
                num_classes,
                zero_init_residual,
                groups,
                width_per_group,
                replace_stride_with_dilation,
                norm_layer,
            )

        def _layer_update_SE(self):
            """Wrap `layer3[1].conv2` with an SE block, print and return `layer3`.

            Intended to be called once: after the call `conv2` is an
            `nn.Sequential`, which has no `out_channels` attribute.
            """
            self.se = SENet1(self.layer3[1].conv2.out_channels, 8)

            # conv2 followed by SE, stored in the slot the block's forward
            # already calls, so the block's forward needs no change.
            self.layer3[1].conv2 = nn.Sequential(self.layer3[1].conv2, self.se)

            print(self.layer3)

            return self.layer3

    def _resnet_SE_layer(
        block,
        layers,
        weights,
        progress: bool,
        **kwargs,
    ):
        """Construct `ResNet_SE_laye`, optionally loading pretrained weights."""
        if weights is not None:
            _ovewrite_named_param(kwargs, "num_classes", len(weights.meta["categories"]))

        model = ResNet_SE_laye(block, layers, **kwargs)

        if weights is not None:
            # Weights are loaded before SE is inserted, so the state-dict keys
            # still match the plain ResNet layout at this point.
            model.load_state_dict(weights.get_state_dict(progress=progress, check_hash=True))

        return model

    def resnet18_SE_layer(*, weights=None, progress: bool = True, **kwargs):
        """ResNet-18 constructor returning a `ResNet_SE_laye` instance."""
        weights = ResNet18_Weights.verify(weights)

        return _resnet_SE_layer(BasicBlock, [2, 2, 2, 2], weights, progress, **kwargs)

    model = resnet18_SE_layer()

    # print(model)

    layer = model._layer_update_SE()

    # The dummy input has 128 channels, matching the SE width demo1 uses;
    # presumably this is what layer3 of ResNet-18 expects - TODO confirm.
    torch.onnx.export(layer, (torch.rand(1, 128, 224, 224),), "layer.onnx")

# Script entry point. Both demo calls below are commented out, so running the
# file directly executes nothing; uncomment the demo you want to run.
if __name__=="__main__":

    # demo1()

    # demo2()

    pass

本文来自互联网用户投稿，该文观点仅代表作者本人，不代表本站立场。本站仅提供信息存储空间服务，不拥有所有权，不承担相关法律责任。如若转载，请注明出处：http://www.mzph.cn/news/889875.shtml

如若内容造成侵权/违法违规/事实不符，请联系多彩编程网进行投诉反馈email:809451989@qq.com，一经查实，立即删除！

12.12 深度学习-卷积的注意力机制-通道注意力SENet

相关文章

使用 Python 从 ROS Bag 中提取图像：详解与实现

【Bolt.new + PromptCoder】三分钟还原油管主页

【小白你好】深度学习的认识和应用：CNN、GNN、LSTM、Transformer、GAN与DRL的对比分析

定时/延时任务-万字解析Spring定时任务原理

JumpServer开源堡垒机搭建及使用

单目动态新视角合成

ResNet网络：深度学习中的革命性架构

如何在Playwright中操作窗口的变化

【GoF23种设计模式】02_单例模式（Singleton Pattern）

Node.js day-01

又要考试了

LoadBalancer负载均衡和Nginx负载均衡区别理解

Linux shell脚本练习(六)

【MQTT 编程】-API

Technitium DNS Server的基本使用1(创建主区域，A记录，开启递归查询，递归到114.114.114.114)

OpenAI 与 ChatGPT 的关系解析

Git简介和特点

CSS学习记录15

《国产单片机，soc的一些现实问题》

AdminJS - 现代化的 Node.js 管理面板框架详解