MAGNet -MAFM 多尺度感知融合模組

iceeci發表於2024-11-27

原文網址 : https://www.cnblogs.com/plumIce/p/18573242

import math
import torch.nn as nn
import torch
from timm.models.layers import trunc_normal_

class COI(nn.Module):
    def __init__(self, inc, k=3, p=1):
        super().__init__()
        self.outc = inc
        self.dw = nn.Conv2d(inc, self.outc, kernel_size=k, padding=p, groups=inc)
        self.conv1_1 = nn.Conv2d(inc, self.outc, kernel_size=1, stride=1)
        self.bn1 = nn.BatchNorm2d(self.outc)
        self.bn2 = nn.BatchNorm2d(self.outc)
        self.bn3 = nn.BatchNorm2d(self.outc)
        self.act = nn.GELU()
        self.apply(self._init_weights)

    def forward(self, x):
        shortcut = self.bn1(x)

        x_dw = self.bn2(self.dw(x))
        x_conv1_1 = self.bn3(self.conv1_1(x))
        return self.act(shortcut + x_dw + x_conv1_1)

    def _init_weights(self, m):
        if isinstance(m, nn.Linear):
            trunc_normal_(m.weight, std=.02)
            if isinstance(m, nn.Linear) and m.bias is not None:
                nn.init.constant_(m.bias, 0)
        elif isinstance(m, nn.LayerNorm):
            nn.init.constant_(m.bias, 0)
            nn.init.constant_(m.weight, 1.0)
        elif isinstance(m, nn.Conv2d):
            fan_out = m.kernel_size[0] * m.kernel_size[1] * m.out_channels
            fan_out //= m.groups
            m.weight.data.normal_(0, math.sqrt(2.0 / fan_out))
            if m.bias is not None:
                m.bias.data.zero_()
class MHMC(nn.Module):
    def __init__(self, dim, ca_num_heads=4, qkv_bias=True, proj_drop=0., ca_attention=1, expand_ratio=2):
        super().__init__()

        self.ca_attention = ca_attention
        self.dim = dim
        self.ca_num_heads = ca_num_heads

        assert dim % ca_num_heads == 0, f"dim {dim} should be divided by num_heads {ca_num_heads}."

        self.act = nn.GELU()
        self.proj = nn.Linear(dim, dim)
        self.proj_drop = nn.Dropout(proj_drop)

        self.split_groups = self.dim // ca_num_heads

        self.v = nn.Linear(dim, dim, bias=qkv_bias)
        self.s = nn.Linear(dim, dim, bias=qkv_bias)
        for i in range(self.ca_num_heads):
            local_conv = nn.Conv2d(dim // self.ca_num_heads, dim // self.ca_num_heads, kernel_size=(3 + i * 2),
                                   padding=(1 + i), stride=1,
                                   groups=dim // self.ca_num_heads)  # kernel_size 3,5,7,9 大核dw卷積，padding 1,2,3,4
            setattr(self, f"local_conv_{i + 1}", local_conv)
        self.proj0 = nn.Conv2d(dim, dim * expand_ratio, kernel_size=1, padding=0, stride=1,
                               groups=self.split_groups)
        self.bn = nn.BatchNorm2d(dim * expand_ratio)
        self.proj1 = nn.Conv2d(dim * expand_ratio, dim, kernel_size=1, padding=0, stride=1)

        self.apply(self._init_weights)

    def _init_weights(self, m):
        if isinstance(m, nn.Linear):
            trunc_normal_(m.weight, std=.02)
            if isinstance(m, nn.Linear) and m.bias is not None:
                nn.init.constant_(m.bias, 0)
        elif isinstance(m, nn.LayerNorm):
            nn.init.constant_(m.bias, 0)
            nn.init.constant_(m.weight, 1.0)
        elif isinstance(m, nn.Conv2d):
            fan_out = m.kernel_size[0] * m.kernel_size[1] * m.out_channels
            fan_out //= m.groups
            m.weight.data.normal_(0, math.sqrt(2.0 / fan_out))
            if m.bias is not None:
                m.bias.data.zero_()

    def forward(self, x, H, W):
        B, N, C = x.shape
        v = self.v(x)
        s = self.s(x).reshape(B, H, W, self.ca_num_heads, C // self.ca_num_heads).permute(3, 0, 4, 1,
                                                                                          2)  # num_heads,B,C,H,W
        for i in range(self.ca_num_heads):
            local_conv = getattr(self, f"local_conv_{i + 1}")
            s_i = s[i]  # B,C,H,W
            s_i = local_conv(s_i).reshape(B, self.split_groups, -1, H, W)
            if i == 0:
                s_out1 = s_i
            else:
                s_out1 = torch.cat([s_out1, s_i], 2)
        s_out1 = s_out1.reshape(B, C, H, W)

        for i in range(self.ca_num_heads):
            local_conv = getattr(self, f"local_conv_{i + 1}")
            s_i = s[i]  # B,C,H,W
            s_i = local_conv(s_i)
            if i == 0:
                s_out = s_i
            else:
                s_out = torch.cat([s_out, s_i], 1)


        s_out = self.proj1(self.act(self.bn(self.proj0(s_out))))
        self.modulator = s_out
        s_out = s_out.reshape(B, C, N).permute(0, 2, 1)
        x = s_out * v

        x = self.proj(x)
        x = self.proj_drop(x)
        return x



# Multi-scale Awareness Fusion Module
class MAFM(nn.Module):
    def __init__(self, inc):
        super().__init__()
        self.outc = inc
        self.attention = MHMC(dim=inc)
        self.coi = COI(inc)
        self.pw = nn.Sequential(
            nn.Conv2d(in_channels=inc, out_channels=inc, kernel_size=1, stride=1),
            nn.BatchNorm2d(inc),
            nn.GELU()
        )
        self.pre_att = nn.Sequential(
            nn.Conv2d(inc * 2, inc * 2, kernel_size=3, padding=1, groups=inc * 2),
            nn.BatchNorm2d(inc * 2),
            nn.GELU(),
            nn.Conv2d(inc * 2, inc, kernel_size=1),
            nn.BatchNorm2d(inc),
            nn.GELU()
        )

        self.apply(self._init_weights)

    def forward(self, x, d):
        # multi = x * d
        # B, C, H, W = x.shape
        # x_cat = torch.cat((x, d, multi), dim=1)

        B, C, H, W = x.shape
        x_cat = torch.cat((x, d), dim=1)
        x_pre = self.pre_att(x_cat)
        # Attention
        x_reshape = x_pre.flatten(2).permute(0, 2, 1)  # B,C,H,W to B,N,C
        attention = self.attention(x_reshape, H, W)  # attention
        attention = attention.permute(0, 2, 1).reshape(B, C, H, W)  # B,N,C to B,C,H,W

        # COI
        x_conv = self.coi(attention)  # dw3*3,1*1,identity
        x_conv = self.pw(x_conv)  # pw

        return x_conv

    def _init_weights(self, m):
        if isinstance(m, nn.Linear):
            trunc_normal_(m.weight, std=.02)
            if isinstance(m, nn.Linear) and m.bias is not None:
                nn.init.constant_(m.bias, 0)
        elif isinstance(m, nn.LayerNorm):
            nn.init.constant_(m.bias, 0)
            nn.init.constant_(m.weight, 1.0)
        elif isinstance(m, nn.Conv2d):
            fan_out = m.kernel_size[0] * m.kernel_size[1] * m.out_channels
            fan_out //= m.groups
            m.weight.data.normal_(0, math.sqrt(2.0 / fan_out))
            if m.bias is not None:
                m.bias.data.zero_()

if __name__ == '__main__':
    x = torch.randn((1, 4, 9, 9)).cuda()
    d = torch.randn((1, 4, 9, 9)).cuda()
    model = MAFM(inc=4).cuda()
    out = model(x,d)
    print(out.shape)

MHMC模組可以看一下這種做法沒見過

YOLOv3 中的多尺度融合與訓練
2020-11-28
YOLO
多模態融合註記
2020-07-03
非度量多維尺度分析
2018-12-22
多程式Multiprocessing模組
2018-04-16
maven多模組管理
2023-02-10
Maven
智慧駕駛-感知-融合定位IMU
2024-04-16
近似熵-樣本熵-多尺度熵
2020-08-23
熵
混合專家更有主見了，能感知多模態分情況行事，Meta提出模態感知型專家混合
2024-08-11
ICCV 2023 ｜當尺度感知調製遇上Transformer，會碰撞出怎樣的火花？
2023-10-09
ORM
超算與智算融合，中科院團隊構建光伏多時間尺度功率預測模型，可融合氣象資料
2024-10-29
模型
自動駕駛系列（五）——環境感知之純視覺和融合感知
2023-01-31
自動駕駛視覺
解讀：Java 11中的模組感知服務載入器
2019-01-10
Java
springboot-多模組構建
2019-07-19
Spring Boot
SnowRabbit全家桶-Laravel多模組
2020-09-15
Laravel
Android模組化與元件化–多模組區分編譯
2019-03-04
Android元件化編譯
vue多專案多模組執行/打包
2021-09-28
Vue
多模態融合(四)Generative Visual Dialogue System viaWeighted Likelihood Estimation
2020-11-15
Go 1.18 新特性多模組工作區教程-讓多模組開發變得簡單
2022-03-21
Go
Android 元件化之通訊（多模組，多程式）
2019-03-01
Android元件化
Springboot建立maven多模組專案
2020-09-27
Spring BootMaven
Android元件化開發案例（融合數10個專案模組）
2019-04-28
Android元件化
SpringBoot多模組專案中無法注入其他模組中的spring bean
2020-12-04
Spring BootBean
空間蛋白質組學：構建複雜組織的尺度圖譜
2024-12-24
python之 threading（多執行緒）模組
2020-05-04
Pythonthread執行緒
如何繫結多個後臺模組
2020-04-04
SpringBoot - 多模組專案的搭建教程
2020-12-02
Spring Boot
序列化模組，隨機數模組，os模組，sys模組，hashlib模組
2019-03-19
隨機
IDEA建立SpringBoot的多模組專案教程
2020-06-27
IdeaSpring Boot
如何構建多模組的SpringBoot專案
2019-05-13
Spring Boot
Spring Boot + MyBatis 多模組專案搭建教程
2021-11-21
Spring BootMyBatis
Java技術分享：SpringBoot多模組開發
2021-05-18
JavaSpring Boot
laravel 多模組模式下進行開發
2021-03-08
Laravel模式
Docker：Docker部署Jenkins並共用宿主機Docker部署微服務多模組（二）構建微服務後端多模組
2024-11-23
DockerJenkins微服務後端
[深度學習]多層感知機（MLP）
2024-04-13
深度學習
Spring Boot - 多模組多環境配置，大廠必備技能
2020-10-30
Spring Boot
python 模組：itsdangerous 模組
2020-02-16
Python
path模組 fs模組
2020-11-09
Python模組：time模組
2021-09-09
Python

MAGNet -MAFM 多尺度感知融合模組

相關文章