How conditional convolution (CondConv) computes
It aggregates multiple expert convolution kernels into a single kernel, which is then applied to the input as an ordinary convolution.
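Before the full module below, the aggregation step can be shown in isolation. This is a minimal sketch with illustrative shapes and names (not taken from the original code): each example gets a vector of routing weights, and its kernel is the routing-weighted sum of the expert kernels.

import torch

num_experts, out_ch, in_ch, k = 3, 2, 1, 2
experts = torch.randn(num_experts, out_ch, in_ch, k, k)   # one kernel per expert
r = torch.softmax(torch.randn(num_experts), dim=0)        # routing weights for one example
# Weighted sum over the expert dimension yields one ordinary conv kernel.
kernel = torch.sum(r[:, None, None, None, None] * experts, dim=0)
print(kernel.shape)  # torch.Size([2, 1, 2, 2])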
import torch
from torch import nn
import torch.nn.functional as F
from torch.nn.modules.conv import _ConvNd
from torch.nn.modules.utils import _pair
from torch.nn.parameter import Parameter
import numpy as np
import functools
class _routing(nn.Module):
    """Routing network: maps pooled per-example features to one weight per expert."""

    def __init__(self, in_channels, num_experts, dropout_rate):
        super(_routing, self).__init__()
        # Note: dropout_rate is accepted for API compatibility but not used in this version.
        self.fc = nn.Linear(in_channels, num_experts)

    def forward(self, x):
        x = torch.flatten(x)
        x = self.fc(x)
        return F.softmax(x, dim=0)
class CondConv2D(_ConvNd):
    r"""Learn specialized convolutional kernels for each example.

    As described in the paper
    `CondConv: Conditionally Parameterized Convolutions for Efficient Inference`_ ,
    conditionally parameterized convolutions (CondConv)
    challenge the paradigm of static convolutional kernels
    by computing convolutional kernels as a function of the input.

    Args:
        in_channels (int): Number of channels in the input image
        out_channels (int): Number of channels produced by the convolution
        kernel_size (int or tuple): Size of the convolving kernel
        stride (int or tuple, optional): Stride of the convolution. Default: 1
        padding (int or tuple, optional): Zero-padding added to both sides of the input. Default: 0
        padding_mode (string, optional): ``'zeros'``, ``'reflect'``, ``'replicate'`` or ``'circular'``. Default: ``'zeros'``
        dilation (int or tuple, optional): Spacing between kernel elements. Default: 1
        groups (int, optional): Number of blocked connections from input channels to output channels. Default: 1
        bias (bool, optional): If ``True``, adds a learnable bias to the output. Default: ``True``
        num_experts (int): Number of experts per layer

    Shape:
        - Input: :math:`(N, C_{in}, H_{in}, W_{in})`
        - Output: :math:`(N, C_{out}, H_{out}, W_{out})` where

          .. math::
              H_{out} = \left\lfloor\frac{H_{in} + 2 \times \text{padding}[0] - \text{dilation}[0]
                        \times (\text{kernel\_size}[0] - 1) - 1}{\text{stride}[0]} + 1\right\rfloor
          .. math::
              W_{out} = \left\lfloor\frac{W_{in} + 2 \times \text{padding}[1] - \text{dilation}[1]
                        \times (\text{kernel\_size}[1] - 1) - 1}{\text{stride}[1]} + 1\right\rfloor

    Attributes:
        weight (Tensor): the learnable weights of the module of shape
            :math:`(\text{out\_channels}, \frac{\text{in\_channels}}{\text{groups}},`
            :math:`\text{kernel\_size[0]}, \text{kernel\_size[1]})`.
            The values of these weights are sampled from
            :math:`\mathcal{U}(-\sqrt{k}, \sqrt{k})` where
            :math:`k = \frac{groups}{C_\text{in} * \prod_{i=0}^{1}\text{kernel\_size}[i]}`
        bias (Tensor): the learnable bias of the module of shape (out_channels). If :attr:`bias` is ``True``,
            then the values of these weights are
            sampled from :math:`\mathcal{U}(-\sqrt{k}, \sqrt{k})` where
            :math:`k = \frac{groups}{C_\text{in} * \prod_{i=0}^{1}\text{kernel\_size}[i]}`

    .. _CondConv: Conditionally Parameterized Convolutions for Efficient Inference:
        https://arxiv.org/abs/1904.04971
    """
    def __init__(self, in_channels, out_channels, kernel_size, stride=1,
                 padding=0, dilation=1, groups=1,
                 bias=True, padding_mode='zeros', num_experts=3, dropout_rate=0.2):
        kernel_size = _pair(kernel_size)
        stride = _pair(stride)
        padding = _pair(padding)
        dilation = _pair(dilation)
        super(CondConv2D, self).__init__(
            in_channels, out_channels, kernel_size, stride, padding, dilation,
            False, _pair(0), groups, bias, padding_mode)

        # Global average pooling summarizes each example before routing.
        self._avg_pooling = functools.partial(F.adaptive_avg_pool2d, output_size=(1, 1))
        self._routing_fn = _routing(in_channels, num_experts, dropout_rate)

        # One kernel per expert: (num_experts, out_channels, in_channels // groups, kH, kW).
        self.weight = Parameter(torch.Tensor(
            num_experts, out_channels, in_channels // groups, *kernel_size))

        self.reset_parameters()
    def _conv_forward(self, input, weight):
        if self.padding_mode != 'zeros':
            # Note: on newer PyTorch releases this attribute is named
            # _reversed_padding_repeated_twice; adjust to match your version.
            return F.conv2d(F.pad(input, self._padding_repeated_twice, mode=self.padding_mode),
                            weight, self.bias, self.stride,
                            _pair(0), self.dilation, self.groups)
        return F.conv2d(input, weight, self.bias, self.stride,
                        self.padding, self.dilation, self.groups)
    def forward(self, inputs):
        b, _, _, _ = inputs.size()
        res = []
        # Route each example separately: pool -> routing weights -> aggregated kernel.
        for input in inputs:
            input = input.unsqueeze(0)
            pooled_inputs = self._avg_pooling(input)
            routing_weights = self._routing_fn(pooled_inputs)
            # Weighted sum of the expert kernels gives this example's kernel.
            kernels = torch.sum(routing_weights[:, None, None, None, None] * self.weight, 0)
            out = self._conv_forward(input, kernels)
            res.append(out)
        return torch.cat(res, dim=0)
# Quick sanity check: 1 input channel, 2 output channels, 2x2 kernel.
c = CondConv2D(1, 2, 2)
x = torch.randn(1, 1, 2, 2)
print(c(x))
That is the PyTorch code. It creates several parallel ("expert") convolution kernels and merges them into a single kernel, channel by channel, using the routing-weighted sum before applying it to each example.
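The merge works because convolution is linear in its weights: convolving with the aggregated kernel gives the same result as taking the routing-weighted sum of each expert's output. A small check with illustrative shapes (not part of the original post):

import torch
import torch.nn.functional as F

x = torch.randn(1, 1, 5, 5)
experts = torch.randn(3, 2, 1, 3, 3)          # 3 experts, each a Conv2d(1, 2, 3) weight
r = torch.softmax(torch.randn(3), dim=0)      # routing weights

# Path 1: combine the kernels first, then convolve once.
combined = torch.sum(r[:, None, None, None, None] * experts, dim=0)
out_combined = F.conv2d(x, combined, padding=1)

# Path 2: convolve with each expert, then combine the outputs.
out_sum = sum(r[i] * F.conv2d(x, experts[i], padding=1) for i in range(3))

print(torch.allclose(out_combined, out_sum, atol=1e-5))  # True, up to float error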