class OrientedASPP(nn.Module):
    """ASPP-style block whose four atrous branches are fused by a learned attention map.

    Four parallel Conv-BatchNorm-ReLU branches (a 1x1 conv and three 3x3 convs
    with dilations ``6 * rate``, ``12 * rate`` and ``18 * rate``) are applied to
    the same input. A 1x1 conv followed by a softmax over its 4 output channels
    produces one weight per branch and per pixel, and the branch outputs are
    summed with those weights.

    Args:
        dim_in: Number of input channels.
        dim_out: Number of channels produced by every branch and by the block.
        rate: Multiplier applied to the base dilations 6, 12 and 18.
    """

    def __init__(self, dim_in, dim_out, rate=1):
        super().__init__()
        # The original comment labels this module a "directional filter bank:
        # 0°, 45°, 90°, 135°"; the visible code only varies the dilation rate.
        # Global-pooling head: registered (so it appears in the state dict) but
        # never used by forward().
        self.conv_arrange = nn.Sequential(
            nn.AdaptiveAvgPool2d(1),
            nn.Conv2d(dim_in, dim_out, 1, 1, 0, bias=True),
            nn.BatchNorm2d(dim_out),
            nn.ReLU(inplace=True),
        )
        self.branch1 = self._branch(dim_in, dim_out, kernel_size=1, padding=0, dilation=rate)
        # For a 3x3 kernel, padding == dilation keeps the spatial size unchanged.
        self.branch2 = self._branch(dim_in, dim_out, kernel_size=3, padding=6 * rate, dilation=6 * rate)
        self.branch3 = self._branch(dim_in, dim_out, kernel_size=3, padding=12 * rate, dilation=12 * rate)
        self.branch4 = self._branch(dim_in, dim_out, kernel_size=3, padding=18 * rate, dilation=18 * rate)
        # Attention head: one weight per branch, normalised across the 4 branches.
        self.orient_att = nn.Sequential(
            nn.Conv2d(4 * dim_out, 4, 1),
            nn.Softmax(dim=1),
        )

    @staticmethod
    def _branch(dim_in, dim_out, kernel_size, padding, dilation):
        """Build one Conv2d -> BatchNorm2d -> ReLU branch."""
        return nn.Sequential(
            nn.Conv2d(dim_in, dim_out, kernel_size, 1, padding=padding, dilation=dilation, bias=True),
            nn.BatchNorm2d(dim_out),
            nn.ReLU(inplace=True),
        )

    def forward(self, x):
        """Return the attention-weighted sum of the four branch outputs.

        Args:
            x: Input tensor of shape [N, dim_in, H, W].

        Returns:
            Tensor of shape [N, dim_out, H, W].
        """
        feats = [self.branch1(x), self.branch2(x), self.branch3(x), self.branch4(x)]
        att = self.orient_att(torch.cat(feats, dim=1))  # [N, 4, H, W]
        # Each attention channel must scale its own branch. The original code
        # multiplied by the whole `feats` list, which raised
        # "TypeError: only integer tensors of a single element can be converted
        # to an index".
        return sum(att[:, i:i + 1] * feat for i, feat in enumerate(feats))

class DynamicRateASPP(nn.Module): def init(self, dim_in, dim_out, rate=1, bn_mom=0.1): super(DynamicRateASPP, self).init() self.dim_in = dim_in self.dim_out = dim_out self.rate = rate self.bn_mom = bn_mom # 用于预测膨胀率的网络 self.rate_predictor = nn.Sequential( nn.AdaptiveAvgPool2d(1), nn.Flatten(), nn.Linear(dim_in, 4), nn.Softmax(dim=1) ) self.base_branch1 = nn.Conv2d(dim_in, dim_out, 1, 1, padding=0, bias=True) self.base_branch2 = nn.Conv2d(dim_in, dim_out, 3, 1, bias=True) self.base_branch3 = nn.Conv2d(dim_in, dim_out, 3, 1, bias=True) self.base_branch4 = nn.Conv2d(dim_in, dim_out, 3, 1, bias=True) self.bn1 = nn.BatchNorm2d(dim_out, momentum=bn_mom) self.bn2 = nn.BatchNorm2d(dim_out, momentum=bn_mom) self.bn3 = nn.BatchNorm2d(dim_out, momentum=bn_mom) self.bn4 = nn.BatchNorm2d(dim_out, momentum=bn_mom

def __init__(self, in_channels, out_channels=256): super().__init__() rates = [1, 3, 6, 9] self.convs = nn.ModuleList([ nn.Sequential( nn.Conv2d(in_channels, out_channels, 3, padding=r, ...

"""
This part contains UNet series models,
including UNet, R2UNet, Attention UNet, R2Attention UNet, DenseUNet
"""
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.nn import init


# ==========================Core Module================================
class conv_block(nn.Module):
    """Two stacked 3x3 Conv -> BatchNorm -> ReLU stages; spatial size is preserved."""

    def __init__(self, ch_in, ch_out):
        super(conv_block, self).__init__()
        self.conv = nn.Sequential(
            nn.Conv2d(ch_in, ch_out, kernel_size=3, stride=1, padding=1, bias=True),
            nn.BatchNorm2d(ch_out),
            nn.ReLU(inplace=True),
            nn.Conv2d(ch_out, ch_out, kernel_size=3, stride=1, padding=1, bias=True),
            nn.BatchNorm2d(ch_out),
            nn.ReLU(inplace=True),
        )

    def forward(self, x):
        return self.conv(x)


class up_conv(nn.Module):
    """2x upsampling followed by a 3x3 Conv -> BatchNorm -> ReLU."""

    def __init__(self, ch_in, ch_out):
        super(up_conv, self).__init__()
        self.up = nn.Sequential(
            nn.Upsample(scale_factor=2),
            nn.Conv2d(ch_in, ch_out, kernel_size=3, stride=1, padding=1, bias=True),
            nn.BatchNorm2d(ch_out),
            nn.ReLU(inplace=True),
        )

    def forward(self, x):
        return self.up(x)


class Recurrent_block(nn.Module):
    """Applies one shared Conv -> BatchNorm -> ReLU repeatedly, re-adding the input each step."""

    def __init__(self, ch_out, t=2):
        super(Recurrent_block, self).__init__()
        self.t = t
        self.ch_out = ch_out
        self.conv = nn.Sequential(
            nn.Conv2d(ch_out, ch_out, kernel_size=3, stride=1, padding=1, bias=True),
            nn.BatchNorm2d(ch_out),
            nn.ReLU(inplace=True),
        )

    def forward(self, x):
        # The first iteration runs the conv twice (once to seed x1, once on
        # x + x1); every later iteration runs it once on x + x1.
        # NOTE(review): with t == 0 the loop never runs and x1 is unbound.
        for i in range(self.t):
            if i == 0:
                x1 = self.conv(x)
            x1 = self.conv(x + x1)
        return x1


class RRCNN_block(nn.Module):
    """1x1 channel projection followed by two Recurrent_blocks and a residual add."""

    def __init__(self, ch_in, ch_out, t=2):
        super(RRCNN_block, self).__init__()
        self.RCNN = nn.Sequential(
            Recurrent_block(ch_out, t=t),
            Recurrent_block(ch_out, t=t),
        )
        self.Conv_1x1 = nn.Conv2d(ch_in, ch_out, kernel_size=1, stride=1, padding=0)

    def forward(self, x):
        x = self.Conv_1x1(x)
        x1 = self.RCNN(x)
        return x + x1


class single_conv(nn.Module):
    """A single 3x3 Conv -> BatchNorm -> ReLU stage."""

    def __init__(self, ch_in, ch_out):
        super(single_conv, self).__init__()
        self.conv = nn.Sequential(
            nn.Conv2d(ch_in, ch_out, kernel_size=3, stride=1, padding=1, bias=True),
            nn.BatchNorm2d(ch_out),
            nn.ReLU(inplace=True),
        )

    def forward(self, x):
        return self.conv(x)


class Attention_block(nn.Module):
    """Attention gate: scales the skip feature ``x`` by a 1-channel sigmoid map.

    The map is computed from the sum of 1x1 projections of the gating signal
    ``g`` and of ``x``, so both inputs must share the same spatial size.
    """

    def __init__(self, F_g, F_l, F_int):
        super(Attention_block, self).__init__()
        self.W_g = nn.Sequential(
            nn.Conv2d(F_g, F_int, kernel_size=1, stride=1, padding=0, bias=True),
            nn.BatchNorm2d(F_int),
        )
        self.W_x = nn.Sequential(
            nn.Conv2d(F_l, F_int, kernel_size=1, stride=1, padding=0, bias=True),
            nn.BatchNorm2d(F_int),
        )
        self.psi = nn.Sequential(
            nn.Conv2d(F_int, 1, kernel_size=1, stride=1, padding=0, bias=True),
            nn.BatchNorm2d(1),
            nn.Sigmoid(),
        )
        self.relu = nn.ReLU(inplace=True)

    def forward(self, g, x):
        g1 = self.W_g(g)
        x1 = self.W_x(x)
        psi = self.relu(g1 + x1)
        psi = self.psi(psi)
        return x * psi


class ChannelAttention(nn.Module):
    """Channel gate built from global average- and max-pooled descriptors.

    Both descriptors pass through the same two-layer 1x1-conv bottleneck; their
    sum goes through a sigmoid and rescales the input channel-wise.
    """

    def __init__(self, channel, reduction=16):
        super(ChannelAttention, self).__init__()
        self.avg_pool = nn.AdaptiveAvgPool2d(1)
        self.max_pool = nn.AdaptiveMaxPool2d(1)
        self.fc = nn.Sequential(
            nn.Conv2d(channel, channel // reduction, 1, bias=False),
            nn.ReLU(inplace=True),
            nn.Conv2d(channel // reduction, channel, 1, bias=False),
        )
        self.sigmoid = nn.Sigmoid()

    def forward(self, x):
        avg_out = self.fc(self.avg_pool(x))
        max_out = self.fc(self.max_pool(x))
        out = avg_out + max_out
        return self.sigmoid(out) * x


def _final_activation(logits):
    """Turn the logits of the last 1x1 conv into probabilities.

    A softmax over a single channel is identically 1.0, so a one-channel head
    (the default ``output_ch=1``) uses a sigmoid instead; heads with several
    channels keep the channel-wise softmax.
    """
    if logits.size(1) == 1:
        return torch.sigmoid(logits)
    return F.softmax(logits, dim=1)


# ==================================================================
class U_Net(nn.Module):
    """U-Net with four 2x down-sampling steps and skip concatenations.

    Args:
        img_ch: Number of input image channels.
        output_ch: Number of output channels.
    """

    def __init__(self, img_ch=3, output_ch=1):
        super(U_Net, self).__init__()

        self.Maxpool = nn.MaxPool2d(kernel_size=2, stride=2)

        self.Conv1 = conv_block(ch_in=img_ch, ch_out=64)
        self.Conv2 = conv_block(ch_in=64, ch_out=128)
        self.Conv3 = conv_block(ch_in=128, ch_out=256)
        self.Conv4 = conv_block(ch_in=256, ch_out=512)
        self.Conv5 = conv_block(ch_in=512, ch_out=1024)

        self.Up5 = up_conv(ch_in=1024, ch_out=512)
        self.Up_conv5 = conv_block(ch_in=1024, ch_out=512)

        self.Up4 = up_conv(ch_in=512, ch_out=256)
        self.Up_conv4 = conv_block(ch_in=512, ch_out=256)

        self.Up3 = up_conv(ch_in=256, ch_out=128)
        self.Up_conv3 = conv_block(ch_in=256, ch_out=128)

        self.Up2 = up_conv(ch_in=128, ch_out=64)
        self.Up_conv2 = conv_block(ch_in=128, ch_out=64)

        self.Conv_1x1 = nn.Conv2d(64, output_ch, kernel_size=1, stride=1, padding=0)

    def forward(self, x):
        # encoding path
        x1 = self.Conv1(x)

        x2 = self.Maxpool(x1)
        x2 = self.Conv2(x2)

        x3 = self.Maxpool(x2)
        x3 = self.Conv3(x3)

        x4 = self.Maxpool(x3)
        x4 = self.Conv4(x4)

        x5 = self.Maxpool(x4)
        x5 = self.Conv5(x5)

        # decoding + concat path
        d5 = self.Up5(x5)
        d5 = torch.cat((x4, d5), dim=1)
        d5 = self.Up_conv5(d5)

        d4 = self.Up4(d5)
        d4 = torch.cat((x3, d4), dim=1)
        d4 = self.Up_conv4(d4)

        d3 = self.Up3(d4)
        d3 = torch.cat((x2, d3), dim=1)
        d3 = self.Up_conv3(d3)

        d2 = self.Up2(d3)
        d2 = torch.cat((x1, d2), dim=1)
        d2 = self.Up_conv2(d2)

        d1 = self.Conv_1x1(d2)
        # The original applied F.softmax(dim=1) unconditionally, which yields a
        # constant 1.0 map for the default single output channel.
        return _final_activation(d1)


# ============================================================
class R2U_Net(nn.Module):
    """U-Net whose convolution stages are recurrent residual blocks (RRCNN_block).

    Args:
        img_ch: Number of input image channels.
        output_ch: Number of output channels.
        t: Recurrence count passed to every RRCNN_block.
    """

    def __init__(self, img_ch=3, output_ch=1, t=2):
        super(R2U_Net, self).__init__()

        self.Maxpool = nn.MaxPool2d(kernel_size=2, stride=2)
        self.Upsample = nn.Upsample(scale_factor=2)  # registered but unused in forward()

        self.RRCNN1 = RRCNN_block(ch_in=img_ch, ch_out=64, t=t)
        self.RRCNN2 = RRCNN_block(ch_in=64, ch_out=128, t=t)
        self.RRCNN3 = RRCNN_block(ch_in=128, ch_out=256, t=t)
        self.RRCNN4 = RRCNN_block(ch_in=256, ch_out=512, t=t)
        self.RRCNN5 = RRCNN_block(ch_in=512, ch_out=1024, t=t)

        self.Up5 = up_conv(ch_in=1024, ch_out=512)
        self.Up_RRCNN5 = RRCNN_block(ch_in=1024, ch_out=512, t=t)

        self.Up4 = up_conv(ch_in=512, ch_out=256)
        self.Up_RRCNN4 = RRCNN_block(ch_in=512, ch_out=256, t=t)

        self.Up3 = up_conv(ch_in=256, ch_out=128)
        self.Up_RRCNN3 = RRCNN_block(ch_in=256, ch_out=128, t=t)

        self.Up2 = up_conv(ch_in=128, ch_out=64)
        self.Up_RRCNN2 = RRCNN_block(ch_in=128, ch_out=64, t=t)

        self.Conv_1x1 = nn.Conv2d(64, output_ch, kernel_size=1, stride=1, padding=0)

    def forward(self, x):
        # encoding path
        x1 = self.RRCNN1(x)

        x2 = self.Maxpool(x1)
        x2 = self.RRCNN2(x2)

        x3 = self.Maxpool(x2)
        x3 = self.RRCNN3(x3)

        x4 = self.Maxpool(x3)
        x4 = self.RRCNN4(x4)

        x5 = self.Maxpool(x4)
        x5 = self.RRCNN5(x5)

        # decoding + concat path
        d5 = self.Up5(x5)
        d5 = torch.cat((x4, d5), dim=1)
        d5 = self.Up_RRCNN5(d5)

        d4 = self.Up4(d5)
        d4 = torch.cat((x3, d4), dim=1)
        d4 = self.Up_RRCNN4(d4)

        d3 = self.Up3(d4)
        d3 = torch.cat((x2, d3), dim=1)
        d3 = self.Up_RRCNN3(d3)

        d2 = self.Up2(d3)
        d2 = torch.cat((x1, d2), dim=1)
        d2 = self.Up_RRCNN2(d2)

        d1 = self.Conv_1x1(d2)
        # Same single-channel softmax problem as U_Net; see _final_activation.
        return _final_activation(d1)


# ===========================================================
class AttU_Net(nn.Module):
    """U-Net whose skip features pass through an Attention_block before concatenation.

    Args:
        img_ch: Number of input image channels.
        output_ch: Number of output channels (sigmoid is applied per channel).
    """

    def __init__(self, img_ch=3, output_ch=1):
        super(AttU_Net, self).__init__()

        self.Maxpool = nn.MaxPool2d(kernel_size=2, stride=2)

        self.Conv1 = conv_block(ch_in=img_ch, ch_out=64)
        self.Conv2 = conv_block(ch_in=64, ch_out=128)
        self.Conv3 = conv_block(ch_in=128, ch_out=256)
        self.Conv4 = conv_block(ch_in=256, ch_out=512)
        self.Conv5 = conv_block(ch_in=512, ch_out=1024)

        self.Up5 = up_conv(ch_in=1024, ch_out=512)
        self.Att5 = Attention_block(F_g=512, F_l=512, F_int=256)
        self.Up_conv5 = conv_block(ch_in=1024, ch_out=512)

        self.Up4 = up_conv(ch_in=512, ch_out=256)
        self.Att4 = Attention_block(F_g=256, F_l=256, F_int=128)
        self.Up_conv4 = conv_block(ch_in=512, ch_out=256)

        self.Up3 = up_conv(ch_in=256, ch_out=128)
        self.Att3 = Attention_block(F_g=128, F_l=128, F_int=64)
        self.Up_conv3 = conv_block(ch_in=256, ch_out=128)

        self.Up2 = up_conv(ch_in=128, ch_out=64)
        self.Att2 = Attention_block(F_g=64, F_l=64, F_int=32)
        self.Up_conv2 = conv_block(ch_in=128, ch_out=64)

        self.Conv_1x1 = nn.Conv2d(64, output_ch, kernel_size=1, stride=1, padding=0)

    def forward(self, x):
        # encoding path
        x1 = self.Conv1(x)

        x2 = self.Maxpool(x1)
        x2 = self.Conv2(x2)

        x3 = self.Maxpool(x2)
        x3 = self.Conv3(x3)

        x4 = self.Maxpool(x3)
        x4 = self.Conv4(x4)

        x5 = self.Maxpool(x4)
        x5 = self.Conv5(x5)

        # decoding + concat path
        d5 = self.Up5(x5)
        x4 = self.Att5(g=d5, x=x4)
        d5 = torch.cat((x4, d5), dim=1)
        d5 = self.Up_conv5(d5)

        d4 = self.Up4(d5)
        x3 = self.Att4(g=d4, x=x3)
        d4 = torch.cat((x3, d4), dim=1)
        d4 = self.Up_conv4(d4)

        d3 = self.Up3(d4)
        x2 = self.Att3(g=d3, x=x2)
        d3 = torch.cat((x2, d3), dim=1)
        d3 = self.Up_conv3(d3)

        d2 = self.Up2(d3)
        x1 = self.Att2(g=d2, x=x1)
        d2 = torch.cat((x1, d2), dim=1)
        d2 = self.Up_conv2(d2)

        d1 = self.Conv_1x1(d2)
        # torch.sigmoid replaces the deprecated F.sigmoid; the values are identical.
        return torch.sigmoid(d1)


# ===========================================================
# conv_block, up_conv and Attention_block were defined a second time here with
# bodies identical to the definitions above; the duplicates have been removed.
class CSAU_Net(nn.Module):
    """Attention U-Net with a ChannelAttention gate after every conv stage.

    Args:
        img_ch: Number of input image channels.
        output_ch: Number of output channels (sigmoid is applied per channel).
    """

    def __init__(self, img_ch=3, output_ch=1):
        super(CSAU_Net, self).__init__()

        self.Maxpool = nn.MaxPool2d(kernel_size=2, stride=2)

        self.Conv1 = conv_block(ch_in=img_ch, ch_out=64)
        self.CA1 = ChannelAttention(channel=64)
        self.Conv2 = conv_block(ch_in=64, ch_out=128)
        self.CA2 = ChannelAttention(channel=128)
        self.Conv3 = conv_block(ch_in=128, ch_out=256)
        self.CA3 = ChannelAttention(channel=256)
        self.Conv4 = conv_block(ch_in=256, ch_out=512)
        self.CA4 = ChannelAttention(channel=512)
        self.Conv5 = conv_block(ch_in=512, ch_out=1024)
        self.CA5 = ChannelAttention(channel=1024)

        self.Up5 = up_conv(ch_in=1024, ch_out=512)
        self.Att5 = Attention_block(F_g=512, F_l=512, F_int=256)
        self.Up_conv5 = conv_block(ch_in=1024, ch_out=512)
        self.CA_Up5 = ChannelAttention(channel=512)

        self.Up4 = up_conv(ch_in=512, ch_out=256)
        self.Att4 = Attention_block(F_g=256, F_l=256, F_int=128)
        self.Up_conv4 = conv_block(ch_in=512, ch_out=256)
        self.CA_Up4 = ChannelAttention(channel=256)

        self.Up3 = up_conv(ch_in=256, ch_out=128)
        self.Att3 = Attention_block(F_g=128, F_l=128, F_int=64)
        self.Up_conv3 = conv_block(ch_in=256, ch_out=128)
        self.CA_Up3 = ChannelAttention(channel=128)

        self.Up2 = up_conv(ch_in=128, ch_out=64)
        self.Att2 = Attention_block(F_g=64, F_l=64, F_int=32)
        self.Up_conv2 = conv_block(ch_in=128, ch_out=64)
        self.CA_Up2 = ChannelAttention(channel=64)

        self.Conv_1x1 = nn.Conv2d(64, output_ch, kernel_size=1, stride=1, padding=0)

    def forward(self, x):
        # encoding path
        x1 = self.Conv1(x)
        x1 = self.CA1(x1)

        x2 = self.Maxpool(x1)
        x2 = self.Conv2(x2)
        x2 = self.CA2(x2)

        x3 = self.Maxpool(x2)
        x3 = self.Conv3(x3)
        x3 = self.CA3(x3)

        x4 = self.Maxpool(x3)
        x4 = self.Conv4(x4)
        x4 = self.CA4(x4)

        x5 = self.Maxpool(x4)
        x5 = self.Conv5(x5)
        x5 = self.CA5(x5)

        # decoding path + skip connections
        d5 = self.Up5(x5)
        x4 = self.Att5(g=d5, x=x4)
        d5 = torch.cat((x4, d5), dim=1)
        d5 = self.Up_conv5(d5)
        d5 = self.CA_Up5(d5)

        d4 = self.Up4(d5)
        x3 = self.Att4(g=d4, x=x3)
        d4 = torch.cat((x3, d4), dim=1)
        d4 = self.Up_conv4(d4)
        d4 = self.CA_Up4(d4)

        d3 = self.Up3(d4)
        x2 = self.Att3(g=d3, x=x2)
        d3 = torch.cat((x2, d3), dim=1)
        d3 = self.Up_conv3(d3)
        d3 = self.CA_Up3(d3)

        d2 = self.Up2(d3)
        x1 = self.Att2(g=d2, x=x1)
        d2 = torch.cat((x1, d2), dim=1)
        d2 = self.Up_conv2(d2)
        d2 = self.CA_Up2(d2)

        d1 = self.Conv_1x1(d2)
        # torch.sigmoid replaces the deprecated F.sigmoid; the values are identical.
        return torch.sigmoid(d1)


if __name__ == '__main__':
    # torchsummary is only needed for this smoke run, so it is imported here
    # rather than at module import time.
    from torchsummary import summary

    # Fall back to the CPU when CUDA is unavailable instead of crashing.
    device = 'cuda' if torch.cuda.is_available() else 'cpu'
    model = AttU_Net(3, 1).to(device)
    summary(model, input_size=(3, 128, 128), device=device)

def __init__(self, in_ch=3, out_ch=1): super().__init__() # 编码器 self.down1 = DoubleConv(in_ch, 64) self.down2 = DoubleConv(64, 128) self.down3 = DoubleConv(128, 256) self.down4 = DoubleConv...

class ACmix(nn.Module): def init(self, in_planes, out_planes, kernel_att=7, head=4, kernel_conv=3, stride=1, dilation=1): super(ACmix, self).init() self.in_planes = in_planes self.out_planes = out_planes self.head = head self.kernel_att = kernel_att self.kernel_conv = kernel_conv self.stride = stride self.dilation = dilation self.rate1 = torch.nn.Parameter(torch.Tensor(1)) self.rate2 = torch.nn.Parameter(torch.Tensor(1)) self.head_dim = self.out_planes // self.head self.conv1 = nn.Conv2d(in_planes, out_planes, kernel_size=1) self.conv2 = nn.Conv2d(in_planes, out_planes, kernel_size=1) self.conv3 = nn.Conv2d(in_planes, out_planes, kernel_size=1) self.conv_p = nn.Conv2d(2, self.head_dim, kernel_size=1) self.padding_att = (self.dilation * (self.kernel_att - 1) + 1) // 2 self.pad_att = torch.nn.ReflectionPad2d(self.padding_att) self.unfold = nn.Unfold(kernel_size=self.kernel_att, padding=0, stride=self.stride) self.softmax = torch.nn.Softmax(dim=1) self.fc = nn.Conv2d(3 * self.head, self.kernel_conv * self.kernel_conv, kernel_size=1, bias=False) self.dep_conv = nn.Conv2d(self.kernel_conv * self.kernel_conv * self.head_dim, out_planes, kernel_size=self.kernel_conv, bias=True, groups=self.head_dim, padding=1, stride=stride) self.reset_parameters()逐行解释代码

def __init__(self, in_planes, out_planes, kernel_att=7, head=4, kernel_conv=3, stride=1, dilation=1): super(ACmix, self).__init__() 定义ACmix类，其中包含了初始化函数__init__()。其中in_planes...

class HetGraphSAGE(torch.nn.Module): def init(self, nfeat1, nfeat2, nhid, out_dim, gamma=0.5, drop_rate=0): super().init() self.Linear1 = nn.Linear(nfeat1, nhid) self.Linear2 = nn.Linear(nfeat2, nhid) self.SAGE1 = SAGEConvLayer(nhid, nhid) self.SAGE1_2 = SAGEConvLayer(nhid, nhid) self.SAGE2 = SAGEConvLayer(nhid, nhid) self.SAGE2_2 = SAGEConvLayer(nhid, nhid) self.outLinear = nn.Linear(nhid, out_dim) self.gamma = gamma self.dropout = drop_rate这里的out_dim不用自己赋值吗

是的，您需要为out_dim赋一个值，否则会报错。...其中nfeat1和nfeat2是输入特征的维度，nhid是隐藏层维度，gamma是SAGEConvLayer中的参数，drop_rate是dropout的概率，out_dim是您指定的输出维度。

# NOTE(review): this section uses `math`, `partial`, `named_apply` and
# `trunc_normal_tf_` without importing them, and uses `nn`/`torch` before the
# import lines further down. They are presumably imported above the visible
# part of the file -- confirm.


def gcd(a, b):
    """Return the greatest common divisor of ``a`` and ``b`` (Euclid's algorithm)."""
    while b:
        a, b = b, a % b
    return a


# Other types of layers can go here (e.g., nn.Linear, etc.)
def _init_weights(module, name, scheme=''):
    """Initialise one module in place according to ``scheme``.

    Conv2d/Conv3d weights are drawn according to ``scheme`` ('normal',
    'trunc_normal', 'xavier_normal', 'kaiming_normal', or anything else for the
    fan-out based "efficientnet like" init) and their bias, when present, is
    zeroed. BatchNorm2d/3d and LayerNorm get weight 1 and bias 0. Any other
    module type is left untouched.

    Args:
        module: The module to initialise.
        name: Unused here; accepted so the function can be called with
            (module, name) pairs.
        scheme: Name of the convolution weight initialisation.
    """
    if isinstance(module, (nn.Conv2d, nn.Conv3d)):
        if scheme == 'normal':
            nn.init.normal_(module.weight, std=.02)
        elif scheme == 'trunc_normal':
            trunc_normal_tf_(module.weight, std=.02)
        elif scheme == 'xavier_normal':
            nn.init.xavier_normal_(module.weight)
        elif scheme == 'kaiming_normal':
            nn.init.kaiming_normal_(module.weight, mode='fan_out', nonlinearity='relu')
        else:
            # efficientnet like
            fan_out = module.kernel_size[0] * module.kernel_size[1] * module.out_channels
            fan_out //= module.groups
            nn.init.normal_(module.weight, 0, math.sqrt(2.0 / fan_out))
        # Every scheme zeroes the bias afterwards.
        if module.bias is not None:
            nn.init.zeros_(module.bias)
    elif isinstance(module, (nn.BatchNorm2d, nn.BatchNorm3d, nn.LayerNorm)):
        nn.init.constant_(module.weight, 1)
        nn.init.constant_(module.bias, 0)


def act_layer(act, inplace=False, neg_slope=0.2, n_prelu=1):
    """Build an activation module from its (case-insensitive) name.

    Args:
        act: One of 'relu', 'relu6', 'leakyrelu', 'prelu', 'gelu', 'hswish'.
        inplace: Passed to the activations that accept it.
        neg_slope: Negative slope for LeakyReLU, initial slope for PReLU.
        n_prelu: Number of PReLU parameters.

    Raises:
        NotImplementedError: If ``act`` is not a supported name.
    """
    act = act.lower()
    if act == 'relu':
        layer = nn.ReLU(inplace)
    elif act == 'relu6':
        layer = nn.ReLU6(inplace)
    elif act == 'leakyrelu':
        layer = nn.LeakyReLU(neg_slope, inplace)
    elif act == 'prelu':
        layer = nn.PReLU(num_parameters=n_prelu, init=neg_slope)
    elif act == 'gelu':
        layer = nn.GELU()
    elif act == 'hswish':
        layer = nn.Hardswish(inplace)
    else:
        raise NotImplementedError('activation layer [%s] is not found' % act)
    return layer


def channel_shuffle(x, groups):
    """Interleave the channels of a 4-D tensor across ``groups`` groups."""
    batchsize, num_channels, height, width = x.size()
    channels_per_group = num_channels // groups
    # reshape to (batch, groups, channels_per_group, H, W), swap the two
    # channel axes, then flatten back to (batch, C, H, W)
    x = x.view(batchsize, groups, channels_per_group, height, width)
    x = torch.transpose(x, 1, 2).contiguous()
    x = x.view(batchsize, -1, height, width)
    return x


# Multi-scale depth-wise convolution (MSDC)
class MSDC(nn.Module):
    """Bank of depth-wise convolutions, one per kernel size.

    Args:
        in_channels: Number of channels (each depth-wise conv keeps this count).
        kernel_sizes: Iterable of kernel sizes, one branch per entry.
        stride: Stride of every depth-wise conv.
        activation: Activation name understood by ``act_layer``.
        dw_parallel: When true every branch sees the same input; otherwise each
            branch output is added to the input that feeds the next branch.
    """

    def __init__(self, in_channels, kernel_sizes, stride, activation='relu6', dw_parallel=True):
        super(MSDC, self).__init__()

        self.in_channels = in_channels
        self.kernel_sizes = kernel_sizes
        self.activation = activation
        self.dw_parallel = dw_parallel

        self.dwconvs = nn.ModuleList([
            nn.Sequential(
                nn.Conv2d(self.in_channels, self.in_channels, kernel_size, stride, kernel_size // 2,
                          groups=self.in_channels, bias=False),
                nn.BatchNorm2d(self.in_channels),
                act_layer(self.activation, inplace=True),
            )
            for kernel_size in self.kernel_sizes
        ])

        self.init_weights('normal')

    def init_weights(self, scheme=''):
        """Apply ``_init_weights`` with ``scheme`` to this module via ``named_apply``."""
        named_apply(partial(_init_weights, scheme=scheme), self)

    def forward(self, x):
        """Return the list of branch outputs, in ``kernel_sizes`` order."""
        outputs = []
        for dwconv in self.dwconvs:
            dw_out = dwconv(x)
            outputs.append(dw_out)
            if not self.dw_parallel:
                # Sequential mode: feed the accumulated features to the next branch.
                x = x + dw_out
        return outputs


class MSCB(nn.Module):
    """
    Multi-scale convolution block (MSCB)

    Point-wise expansion -> MSDC -> (sum or concat of the branch outputs) ->
    channel shuffle -> point-wise projection, with a residual connection when
    ``stride == 1``.

    Args:
        in_channels: Input channels.
        out_channels: Output channels.
        shortcut: When true the MSDC outputs are summed; otherwise concatenated.
        stride: 1 or 2.
        kernel_sizes: Kernel sizes of the depth-wise branches.
        expansion_factor: Channel multiplier of the first point-wise conv.
        dw_parallel: Forwarded to MSDC.
        activation: Activation name understood by ``act_layer``.
    """

    # The default was the mutable list [1, 3, 5]; an equivalent tuple avoids
    # sharing one list object between instances.
    def __init__(self, in_channels, out_channels, shortcut=False, stride=1, kernel_sizes=(1, 3, 5),
                 expansion_factor=2, dw_parallel=True, activation='relu6'):
        super(MSCB, self).__init__()

        add = shortcut
        self.in_channels = in_channels
        self.out_channels = out_channels
        self.stride = stride
        self.kernel_sizes = kernel_sizes
        self.expansion_factor = expansion_factor
        self.dw_parallel = dw_parallel
        self.add = add
        self.activation = activation
        self.n_scales = len(self.kernel_sizes)
        # check stride value
        assert self.stride in [1, 2]
        # Skip connection if stride is 1
        self.use_skip_connection = self.stride == 1

        # expansion factor
        self.ex_channels = int(self.in_channels * self.expansion_factor)
        self.pconv1 = nn.Sequential(
            # pointwise convolution
            nn.Conv2d(self.in_channels, self.ex_channels, 1, 1, 0, bias=False),
            nn.BatchNorm2d(self.ex_channels),
            act_layer(self.activation, inplace=True),
        )
        self.msdc = MSDC(self.ex_channels, self.kernel_sizes, self.stride, self.activation,
                         dw_parallel=self.dw_parallel)
        # Summing keeps ex_channels; concatenating multiplies by the branch count.
        if self.add:
            self.combined_channels = self.ex_channels * 1
        else:
            self.combined_channels = self.ex_channels * self.n_scales
        self.pconv2 = nn.Sequential(
            # pointwise convolution
            nn.Conv2d(self.combined_channels, self.out_channels, 1, 1, 0, bias=False),
            nn.BatchNorm2d(self.out_channels),
        )
        if self.use_skip_connection and (self.in_channels != self.out_channels):
            # 1x1 projection so the residual matches the output channel count.
            self.conv1x1 = nn.Conv2d(self.in_channels, self.out_channels, 1, 1, 0, bias=False)

        self.init_weights('normal')

    def init_weights(self, scheme=''):
        """Apply ``_init_weights`` with ``scheme`` to this module via ``named_apply``."""
        named_apply(partial(_init_weights, scheme=scheme), self)

    def forward(self, x):
        pout1 = self.pconv1(x)
        msdc_outs = self.msdc(pout1)
        if self.add:
            dout = 0
            for dwout in msdc_outs:
                dout = dout + dwout
        else:
            dout = torch.cat(msdc_outs, dim=1)
        dout = channel_shuffle(dout, gcd(self.combined_channels, self.out_channels))
        out = self.pconv2(dout)
        if self.use_skip_connection:
            if self.in_channels != self.out_channels:
                x = self.conv1x1(x)
            return x + out
        return out


def autopad(k, p=None, d=1):  # kernel, padding, dilation
    """Pad to 'same' shape outputs."""
    if d > 1:
        k = d * (k - 1) + 1 if isinstance(k, int) else [d * (x - 1) + 1 for x in k]  # actual kernel-size
    if p is None:
        p = k // 2 if isinstance(k, int) else [x // 2 for x in k]  # auto-pad
    return p


class Conv(nn.Module):
    """Standard convolution with args(ch_in, ch_out, kernel, stride, padding, groups, dilation, activation)."""

    default_act = nn.SiLU()  # default activation

    def __init__(self, c1, c2, k=1, s=1, p=None, g=1, d=1, act=True):
        """Initialize Conv layer with given arguments including activation."""
        super().__init__()
        self.conv = nn.Conv2d(c1, c2, k, s, autopad(k, p, d), groups=g, dilation=d, bias=False)
        self.bn = nn.BatchNorm2d(c2)
        # act=True -> shared default SiLU; an nn.Module -> that module; anything else -> identity.
        self.act = self.default_act if act is True else act if isinstance(act, nn.Module) else nn.Identity()

    def forward(self, x):
        """Apply convolution, batch normalization and activation to input tensor."""
        return self.act(self.bn(self.conv(x)))

    def forward_fuse(self, x):
        """Apply convolution and activation only, skipping batch normalization."""
        return self.act(self.conv(x))


import torch
from torch import nn
# NOTE(review): this import rebinds `Conv`, shadowing the class defined just
# above from this point on -- confirm which one is intended.
from ultralytics.nn.modules.conv import Conv
from torch.nn import functional as F


class Channel_Att(nn.Module):
    """Channel attention that reuses BatchNorm scale factors as channel weights.

    Args:
        channels: Number of input channels.
        t: Unused.
    """

    def __init__(self, channels, t=16):
        super(Channel_Att, self).__init__()
        self.channels = channels

        self.bn2 = nn.BatchNorm2d(self.channels, affine=True)

    def forward(self, x):
        residual = x

        x = self.bn2(x)
        # Normalised absolute BatchNorm weights; read through `.data`, so they
        # are detached from autograd.
        weight_bn = self.bn2.weight.data.abs() / torch.sum(self.bn2.weight.data.abs())
        # Move channels last so the per-channel weights broadcast, then move back.
        x = x.permute(0, 2, 3, 1).contiguous()
        x = torch.mul(weight_bn, x)
        x = x.permute(0, 3, 1, 2).contiguous()

        x = torch.sigmoid(x) * residual

        return x


class NAMAttention(nn.Module):
    """Thin wrapper that applies ``Channel_Att`` to its input.

    Args:
        channels: Number of input channels.
        shape: Unused.
        out_channels: Unused.
        no_spatial: Unused.
    """

    def __init__(self, channels, shape, out_channels=None, no_spatial=True):
        super(NAMAttention, self).__init__()
        self.Channel_Att = Channel_Att(channels)

    def forward(self, x):
        x_out1 = self.Channel_Att(x)

        return x_out1


# Request that accompanied this code (translated): based on the code above and
# following the structure of Conv, create a module named MSConv whose input
# feeds two branches -- the first is MSDC -> BatchNorm2d -> SiLU, the second is
# NAM attention running in parallel with those three modules -- and merge the
# SiLU output with the NAM output as the final output. Mind the constructor
# parameters of the NAM attention.

def __init__(self, in_channels): super(SpatialAttention, self).__init__() self.bn = nn.BatchNorm2d(in_channels, affine=True) def forward(self, x): residual = x x = self.bn(x) # 提取gamma（缩放...

import numpy as np
from resnet import resnet50
import torch
import torch.nn as nn
from densenet3D import DenseNet3D
from vit3D import ViT

# Width of the feature vector each supported image encoder is expected to emit.
_ENCODER_FEATURE_DIMS = {
    'resnet50': 2048,
    'vit': 1024,
    'dense3D': 1024,
}


def _encoder_feature_dim(img_encoder):
    """Return the feature width for ``img_encoder``.

    Raises:
        ValueError: If ``img_encoder`` is not one of the supported names. The
            original code fell through to an unbound ``input_dim`` instead.
    """
    try:
        return _ENCODER_FEATURE_DIMS[img_encoder]
    except KeyError:
        raise ValueError(
            f"unsupported img_encoder {img_encoder!r}; expected one of {sorted(_ENCODER_FEATURE_DIMS)}"
        ) from None


class AttentionFusion(nn.Module):
    """Fuse two equally sized feature vectors with learned softmax weights.

    Args:
        input_dim: Width of each of the two input feature vectors.
        hidden_dim: Width of the hidden layer of the weighting MLP.
    """

    def __init__(self, input_dim, hidden_dim):
        super(AttentionFusion, self).__init__()
        # Attention layers: concatenated features -> two weights that sum to 1.
        self.attention = nn.Sequential(
            nn.Linear(input_dim * 2, hidden_dim),
            nn.ReLU(),
            nn.Linear(hidden_dim, 2),
            nn.Softmax(dim=1),
        )

    def forward(self, feat1, feat2):
        combined_feat = torch.cat((feat1, feat2), dim=1)
        weights = self.attention(combined_feat)
        # Slices keep a trailing dimension of 1 so the weights broadcast over features.
        feat_fused = weights[:, 0:1] * feat1 + weights[:, 1:2] * feat2
        return feat_fused


class ImageFusionModel(nn.Module):
    """Encode a DWI and a T2 image with separate encoders and fuse the features.

    Args:
        img_encoder: 'resnet50', 'vit' or 'dense3D'.
        device: Device the resnet50 encoders and the fusion layer are moved to.
            The 'vit' and 'dense3D' encoders are not moved here.

    Raises:
        ValueError: If ``img_encoder`` is not a supported name.
    """

    def __init__(self, img_encoder='resnet50',
                 device=torch.device('cuda' if torch.cuda.is_available() else 'cpu')):
        super(ImageFusionModel, self).__init__()
        input_dim = _encoder_feature_dim(img_encoder)
        self.img_encoder = img_encoder
        if img_encoder == 'resnet50':
            self.DWI_ImgEncoder = resnet50().to(device)
            self.T2_ImgEncoder = resnet50().to(device)
        elif img_encoder == 'vit':
            self.DWI_ImgEncoder = self._build_vit()
            self.T2_ImgEncoder = self._build_vit()
        elif img_encoder == 'dense3D':
            self.DWI_ImgEncoder = DenseNet3D()
            self.T2_ImgEncoder = DenseNet3D()

        # Attention layers
        self.ImgAttentionFusion = AttentionFusion(input_dim=input_dim, hidden_dim=256).to(device)

    @staticmethod
    def _build_vit():
        """Build one ViT encoder with the configuration shared by both modalities."""
        return ViT(
            image_size=224,        # image size
            frames=12,             # number of frames
            image_patch_size=4,    # image patch size
            frame_patch_size=2,    # frame patch size
            num_classes=1024,
            mlp_dim=2048,
            dim=1024,
            depth=6,
            heads=8,
            dropout=0.1,
            emb_dropout=0.1,
        )

    def forward(self, DWI_ImgTensor, T2_ImgTensor):
        if self.img_encoder == 'resnet50':
            # The resnet50 encoder returns a pair; only the second item is used.
            _, DWI_features = self.DWI_ImgEncoder(DWI_ImgTensor)
            _, T2_features = self.T2_ImgEncoder(T2_ImgTensor)
        else:
            DWI_features = self.DWI_ImgEncoder(DWI_ImgTensor)
            T2_features = self.T2_ImgEncoder(T2_ImgTensor)
        # Debug output kept from the original (printed on every forward pass).
        print("DWI_features", DWI_features.shape)
        fused_features = self.ImgAttentionFusion(DWI_features, T2_features)
        return fused_features


class MLP(nn.Module):
    """
    Standard fully-connected MLP with configurable hidden layers, batch norm, activation, and dropout.

    Args:
        input_dim (int): width of the input features
        hidden_dims (list of int): width of each hidden layer, in order
        output_dim (int): width of the output
        activation (callable or nn.Module): (e.g., nn.ReLU or nn.ReLU())
        dropout (float): dropout rate
        batchnorm (bool): insert BatchNorm1d after every hidden Linear layer

    Raises:
        ValueError: If ``activation`` is neither an nn.Module class nor instance.
    """

    def __init__(
        self,
        input_dim,
        hidden_dims,
        output_dim,
        activation=nn.ReLU,
        dropout=0.0,
        batchnorm=False,
    ):
        super().__init__()
        if isinstance(activation, type) and issubclass(activation, nn.Module):
            activation_layer = activation
        elif isinstance(activation, nn.Module):
            # An instance is reused as-is for every hidden layer.
            activation_layer = lambda: activation
        else:
            raise ValueError("activation must be an nn.Module class or instance")

        layers = []
        in_dim = input_dim
        for h_dim in hidden_dims:
            layers.append(nn.Linear(in_dim, h_dim))
            if batchnorm:
                layers.append(nn.BatchNorm1d(h_dim))
            layers.append(activation_layer())
            if dropout > 0:
                layers.append(nn.Dropout(dropout))
            in_dim = h_dim
        layers.append(nn.Linear(in_dim, output_dim))

        self.net = nn.Sequential(*layers)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """
        Args:
            x: shape (batch_size, input_dim)
        Returns:
            shape (batch_size, output_dim)
        """
        return self.net(x)


class End2EndModel(nn.Module):
    """Combine fused image features, extracted image features and clinical features.

    The three parts are concatenated (512 + 512 + 16 values) and mapped to one
    sigmoid output.

    Args:
        img_encoder: 'resnet50', 'vit' or 'dense3D'.
        device: Accepted but not used; the image fusion sub-model is always
            built on the CPU. NOTE(review): confirm this is intentional.

    Raises:
        ValueError: If ``img_encoder`` is not a supported name.
    """

    def __init__(self, img_encoder='resnet50',
                 device=torch.device('cuda' if torch.cuda.is_available() else 'cpu')):
        super(End2EndModel, self).__init__()
        input_dim = _encoder_feature_dim(img_encoder)
        self.img_encoder = img_encoder
        self.ImageFusionLayer = ImageFusionModel(img_encoder=self.img_encoder, device=torch.device('cpu'))
        # 2030 is the hard-coded width of each extracted-feature tensor.
        self.extractedImageFusedLayer = AttentionFusion(input_dim=2030, hidden_dim=2048)
        self.ImageMLP = MLP(input_dim=input_dim, hidden_dims=[1024], output_dim=512)
        self.ExtractedImageMLP = MLP(input_dim=2030, hidden_dims=[1024], output_dim=512)
        # 512 image + 512 extracted + 16 clinical features.
        self.concat_fusion_layer = MLP(input_dim=512 + 512 + 16, hidden_dims=[512], output_dim=1)

    def forward(self, DWI_ImgTensor, T2_ImgTensor, DWI_feature_tensor, T2_feature_tensor, clinical_features):
        """Return ``(output, x)``: the sigmoid prediction and the concatenated features."""
        image_fused_features = self.ImageFusionLayer(DWI_ImgTensor=DWI_ImgTensor, T2_ImgTensor=T2_ImgTensor)
        extracted_fusion_features = self.extractedImageFusedLayer(feat1=DWI_feature_tensor,
                                                                  feat2=T2_feature_tensor)
        image_X = self.ImageMLP(image_fused_features)
        extracted_image_X = self.ExtractedImageMLP(extracted_fusion_features)
        x = torch.cat((image_X, extracted_image_X, clinical_features), dim=1)
        output = self.concat_fusion_layer(x)
        output = torch.sigmoid(output)
        return output, x


# Request that accompanied this code (translated): add a cross-attention module.
# DWI_ImgTensor and T2_ImgTensor keep the existing fusion; DWI_feature_tensor
# and T2_feature_tensor skip the existing attention fusion and are merged into
# one table of 20 features called omicsfestures; clinical_features becomes 3
# features. image_X is then fused with omicsfestures and with clinical_features
# through cross attention (image_X as Q, the other two as K and V), and
# image_X, the cross-attended omics features and the cross-attended clinical
# features are concatenated to give x.

特征拼接融合pythonimporttorchimporttorch.nnasnnclassCrossModalFusion(nn.Module):def__init__(self,image_dim,omics_dim,clinical_dim,embed_dim,num_heads):super().__init__()#特征投影层（统一维度）self....

class LinearRegressionModel(nn.Module):
    """Linear regression as a single fully connected layer.

    Args:
        input_dim: Number of input features.
        output_dim: Number of regression targets.
    """

    # The constructor was spelled `_init_` (single underscores), so Python never
    # called it, and its super() call referenced the misspelled, undefined name
    # `LinnearRegressionModel`.
    def __init__(self, input_dim, output_dim):
        super(LinearRegressionModel, self).__init__()
        self.linear = nn.Linear(input_dim, output_dim)

    def forward(self, x):
        """Return ``self.linear(x)``."""
        out = self.linear(x)
        return out

def __init__(self, input_dim, output_dim): super(LinearRegressionModel, self).__init__() self.linear = torch.nn.Linear(input_dim, output_dim) def forward(self, x): out = self.linear(x) return ...

我是说找不到你上面说的下面这个改的地方。 1. 主干网络输出层配置问题 (LSKNet.py) 问题：LSKNet默认输出特征图层数不足，导致BiFPN输入索引越界 Python # LSKNet.py 原始代码 class LSKNet(nn.Module): def init(self, ..., out_indices=(0, 1, 2, 3)) # 默认输出4层特征图解决方案：扩展输出层数满足BiFPN需求 Python # 修改后 class LSKNet(nn.Module): def init(self, ..., out_indices=(0, 1, 2, 3, 4)): # 增加输出层 super().init() self.stages = nn.ModuleList([ self._make_stage(...) for _ in range(5) # 确保5个stage ])

def __init__(self, img_size=224, in_chans=3, dim=None, # 修改以下参数 embed_dims=[64, 128, 256, 512, 512], # 新增第5层 mlp_ratios=[8, 8, 4, 4, 4], # 新增第5层比例 depths=[3, 4, 6, 3, 2], # 新增2...

class BERTBiLSTMCRF(nn.Module): def init(self, bert_model_dir, num_labels, hidden_dim=256): super(BERTBiLSTMCRF, self).init() self.bert = BertModel.from_pretrained(bert_model_dir) self.lstm = nn.LSTM(input_size=768, hidden_size=hidden_dim, num_layers=2, batch_first=True, bidirectional=True) self.fc = nn.Linear(hidden_dim * 2, num_labels) self.crf = CRF(num_tags=num_labels, batch_first=True) def forward(self, input_ids, attention_mask=None, labels=None): outputs = self.bert(input_ids=input_ids, attention_mask=attention_mask) sequence_output = outputs.last_hidden_state lstm_out, _ = self.lstm(sequence_output) emissions = self.fc(lstm_out) if labels is not None: loss = -self.crf(emissions, labels, mask=attention_mask.bool(), reduction='mean') return基于上述，设计BERT+BiLSTM+Attention+ CRF的命名实体识别模型

def __init__(self, num_tags, lstm_units=128, dropout_rate=0.3): super().__init__() self.bert = TFBertModel.from_pretrained("bert-base-chinese") self.bilstm = Bidirectional(LSTM(lstm_units, return_...

#增加多头注意力机制 import torch import torch.nn as nn import torch.nn.functional as F from torch.utils.data import DataLoader, TensorDataset import pandas as pd import numpy as np from sklearn.preprocessing import StandardScaler from TCN.tcn import TemporalConvNet,Chomp1d,TemporalBlock import matplotlib.pyplot as plt import time # 配置参数 device = torch.device("cuda" if torch.cuda.is_available() else "cpu") SEQ_LENGTH = 120 BATCH_SIZE = 128 # 减小批次以适应注意力计算 EPOCHS = 100 LEARNING_RATE = 5e-5 # 调整学习率 SPLIT_RATIO = 0.8 # 多头时间注意力模块 class MultiHeadTemporalAttention(nn.Module): def init(self, embed_size, heads=4): super().init() self.embed_size = embed_size self.heads = heads self.head_dim = embed_size // heads self.query = nn.Linear(embed_size, embed_size) self.key = nn.Linear(embed_size, embed_size) self.value = nn.Linear(embed_size, embed_size) self.fc_out = nn.Linear(embed_size, embed_size) def forward(self, x): batch_size, seq_len, _ = x.shape Q = self.query(x).view(batch_size, seq_len, self.heads, self.head_dim).permute(0, 2, 1, 3) K = self.key(x).view(batch_size, seq_len, self.heads, self.head_dim).permute(0, 2, 1, 3) V = self.value(x).view(batch_size, seq_len, self.heads, self.head_dim).permute(0, 2, 1, 3) energy = torch.matmul(Q, K.permute(0, 1, 3, 2)) / (self.head_dim ** 0.5) attention = F.softmax(energy, dim=-1) out = torch.matmul(attention, V) out = out.permute(0, 2, 1, 3).contiguous().view(batch_size, seq_len, self.embed_size) return self.fc_out(out) # 带注意力的时序块 class AttentiveTemporalBlock(nn.Module): def init(self, n_inputs, n_outputs, kernel_size, stride, dilation, padding, dropout=0.2): super().init() self.conv1 = nn.utils.weight_norm(nn.Conv1d( n_inputs, n_outputs, kernel_size, stride=stride, padding=p针对TCN模型改进的多头注意力机制的原理是什么然后使用多头注意力机制进行改进TCN的步骤及流程是什么

self.res = nn.Conv1d(in_channels, out_channels, 1) if in_channels != out_channels else None self.relu = nn.ReLU() def forward(self, x): residual = x if self.res is None else self.res(x) out = ...

import torch import torch.nn as nn import torch.nn.functional as F from torch.utils.data import Dataset, DataLoader import torchaudio import numpy as np import os class WaveNetLayer(nn.Module): """修正后的WaveNet层，确保输出尺寸一致""" def init(self, in_channels, out_channels, dilation): super().init() self.conv_filter = nn.Conv1d(in_channels, out_channels, kernel_size=2, dilation=dilation, padding=dilation) self.conv_gate = nn.Conv1d(in_channels, out_channels, kernel_size=2, dilation=dilation, padding=dilation) self.res_conv = nn.Conv1d(out_channels, in_channels, kernel_size=1) self.skip_conv = nn.Conv1d(out_channels, out_channels, kernel_size=1) def forward(self, x): filtered = torch.tanh(self.conv_filter(x)) gated = torch.sigmoid(self.conv_gate(x)) combined = filtered * gated res = self.res_conv(combined) + x skip = self.skip_conv(combined) return res, skip class WaveNet(nn.Module): """修正后的WaveNet结构，确保特征提取能力""" def init(self, in_channels, hidden_size=128): super().init() self.layers = nn.ModuleList() num_layers = 8 channels = 64 self.start_conv = nn.Conv1d(in_channels, channels, kernel_size=1) # 创建多个膨胀卷积层 for i in range(num_layers): dilation = 2 ** i self.layers.append(WaveNetLayer(channels, channels, dilation)) self.end_conv1 = nn.Conv1d(channels, hidden_size, kernel_size=1) self.end_conv2 = nn.Conv1d(hidden_size, hidden_size, kernel_size=1) def forward(self, x): x = self.start_conv(x) skip_connections = [] for layer in self.layers: x, skip = layer(x) skip_connections.append(skip) # 聚合所有跳跃连接 x = torch.stack(skip_connections).sum(dim=0) x = F.relu(self.end_conv1(x)) x = self.end_conv2(x) return x class OneClassModel(nn.Module): def init(self, encod

self.conv = nn.Conv1d(in_channels, out_channels, kernel_size, padding=(kernel_size-1)*dilation, dilation=dilation) 2. **One-Class特征提取** - 在WaveNet编码器后添加特征压缩层： $$ z = \...

import torch import torch.nn as nn import torch.nn.init as init from TransformerBlock import MultiheadAttention from .NeuralNetwork import NeuralNetwork import torch.nn.functional as F from .GAT import GATConv import torch_geometric.utils as utils class Attention(nn.Module): def init(self, in_features, hidden_size): super(Attention, self).init() self.linear1 = nn.Linear(in_features*2, hidden_size) self.linear2 = nn.Linear(hidden_size, 1) self.activation = nn.ReLU() self.dropout = nn.Dropout(0.5) self.reset_parameters() def reset_parameters(self): init.xavier_normal_(self.linear1.weight) init.xavier_normal_(self.linear2.weight) def forward(self, K, V, mask = None): ''' :param K: (batch_size, d) :param V: (batch_size, hist_len, d) :return: (batch_size, d) ''' K = K.unsqueeze(dim=1).expand(V.size()) fusion = torch.cat([K, V], dim=-1) fc1 = self.activation(self.linear1(fusion)) score = self.linear2(fc1) if mask is not None: mask = mask.unsqueeze(dim=-1) score = score.masked_fill(mask, -2 ** 32 + 1) alpha = F.softmax(score, dim=1) alpha = self.dropout(alpha) att = (alpha * V).sum(dim=1) return att class GLAN(NeuralNetwork): def init(self, config, graph): super(GLAN, self).init() self.config = config embedding_weights = config['embedding_weights'] V, D = embedding_weights.shape maxlen = config['maxlen'] dropout_rate = config['dropout'] alpha = 0.4 self.graph = graph self.word_embedding = nn.Embedding(V, D, padding_idx=0, _weight=torch.from_numpy(embedding_weights)) self.user_tweet_embedding = nn.Embedding(graph.num_nodes, 300, padding_idx=0) self.mh_attention = MultiheadAttention(input_size=300, output_size=300) self.linear_fuse = nn.Lin

def __init__(self, in_features, out_features, num_heads): super().__init__() self.W = nn.Linear(in_features, out_features * num_heads) self.attn = nn.Linear(2 * out_features, 1) self.num_heads = ...

# Copyright 2020 Huawei Technologies Co., Ltd # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. # ============================================================================ """wide and deep model""" import time import numpy as np from mindspore import nn, context from mindspore import Parameter, ParameterTuple import mindspore.common.dtype as mstype import mindspore.ops as ops from mindspore.nn import Dropout from mindspore.nn.optim import Adam, FTRL from mindspore.common.initializer import Uniform, initializer from mindspore.context import ParallelMode from mindspore.nn.wrap.grad_reducer import DistributedGradReducer from mindspore.communication.management import get_group_size np_type = np.float32 ms_type = mstype.float32 def init_method(method, shape, name, max_val=1.0): ''' parameter init method ''' if method in ['uniform']: params = Parameter(initializer( Uniform(max_val), shape, ms_type), name=name) elif method == "one": params = Parameter(initializer("ones", shape, ms_type), name=name) elif method == 'zero': params = Parameter(initializer("zeros", shape, ms_type), name=name) elif method == "normal": params = Parameter(initializer("normal", shape, ms_type), name=name) return params def init_var_dict(init_args, in_vars): ''' var init function ''' var_map = {} _, _max_val = init_args for _, item in enumerate(in_vars): key, shape, method = item if key not in var_map.keys(): if method in ['random', 'uniform']: var_map[key] = 
Parameter(initializer( Uniform(_max_val), shape, ms_type), name=key) elif method == "one": var_map[key] = Parameter(initializer( "ones", shape, ms_type), name=key) elif method == "zero": var_map[key] = Parameter(initializer( "zeros", shape, ms_type), name=key) elif method == 'normal': var_map[key] = Parameter(initializer( "normal", shape, ms_type), name=key) return var_map class DenseLayer(nn.Cell): """ Dense Layer for Deep Layer of WideDeep Model; Containing: activation, matmul, bias_add; Args: """ def init(self, input_dim, output_dim, weight_bias_init, act_str, keep_prob=0.5, use_activation=True, convert_dtype=True, drop_out=False): super(DenseLayer, self).init() weight_init, bias_init = weight_bias_init self.weight = init_method( weight_init, [input_dim, output_dim], name="weight") self.bias = init_method(bias_init, [output_dim], name="bias") self.act_func = self._init_activation(act_str) self.matmul = ops.MatMul(transpose_b=False) self.bias_add = ops.BiasAdd() self.cast = ops.Cast() self.dropout = Dropout(keep_prob=(1 - keep_prob)) self.use_activation = use_activation self.convert_dtype = convert_dtype self.drop_out = drop_out def _init_activation(self, act_str): act_str = act_str.lower() if act_str == "relu": act_func = ops.ReLU() elif act_str == "sigmoid": act_func = ops.Sigmoid() elif act_str == "tanh": act_func = ops.Tanh() return act_func def construct(self, x): ''' Construct Dense layer ''' if self.training and self.drop_out: x = self.dropout(x) if self.convert_dtype: x = self.cast(x, mstype.float16) weight = self.cast(self.weight, mstype.float16) bias = self.cast(self.bias, mstype.float16) wx = self.matmul(x, weight) wx = self.bias_add(wx, bias) if self.use_activation: wx = self.act_func(wx) wx = self.cast(wx, mstype.float32) else: wx = self.matmul(x, self.weight) wx = self.bias_add(wx, self.bias) if self.use_activation: wx = self.act_func(wx) return wx class WideDeepModel(nn.Cell): """ From paper: " Wide & Deep Learning for Recommender Systems" Args: 
config (Class): The default config of Wide&Deep """ def init(self, config): super(WideDeepModel, self).init() self.batch_size = config.batch_size host_device_mix = bool(config.host_device_mix) parameter_server = bool(config.parameter_server) parallel_mode = context.get_auto_parallel_context("parallel_mode") is_auto_parallel = parallel_mode in (ParallelMode.SEMI_AUTO_PARALLEL, ParallelMode.AUTO_PARALLEL) if is_auto_parallel: self.batch_size = self.batch_size * get_group_size() sparse = config.sparse self.field_size = config.field_size self.emb_dim = config.emb_dim self.weight_init, self.bias_init = config.weight_bias_init self.deep_input_dims = self.field_size * self.emb_dim self.all_dim_list = [self.deep_input_dims] + config.deep_layer_dim + [1] init_acts = [('Wide_b', [1], config.emb_init)] var_map = init_var_dict(config.init_args, init_acts) self.wide_b = var_map["Wide_b"] self.dense_layer_1 = DenseLayer(self.all_dim_list[0], self.all_dim_list[1], config.weight_bias_init, config.deep_layer_act, convert_dtype=True, drop_out=config.dropout_flag) self.dense_layer_2 = DenseLayer(self.all_dim_list[1], self.all_dim_list[2], config.weight_bias_init, config.deep_layer_act, convert_dtype=True, drop_out=config.dropout_flag) self.dense_layer_3 = DenseLayer(self.all_dim_list[2], self.all_dim_list[3], config.weight_bias_init, config.deep_layer_act, convert_dtype=True, drop_out=config.dropout_flag) self.dense_layer_4 = DenseLayer(self.all_dim_list[3], self.all_dim_list[4], config.weight_bias_init, config.deep_layer_act, convert_dtype=True, drop_out=config.dropout_flag) self.dense_layer_5 = DenseLayer(self.all_dim_list[4], self.all_dim_list[5], config.weight_bias_init, config.deep_layer_act, use_activation=False, convert_dtype=True, drop_out=config.dropout_flag) self.wide_mul = ops.Mul() self.deep_mul = ops.Mul() self.reduce_sum = ops.ReduceSum(keep_dims=False) self.reshape = ops.Reshape() self.deep_reshape = ops.Reshape() self.square = ops.Square() self.concat = 
ops.Concat(axis=1) self.unique = ops.Unique().shard(((1,),)) self.wide_gatherv2 = ops.Gather() self.deep_gatherv2 = ops.Gather() if is_auto_parallel and sparse and not config.field_slice and not parameter_server: target = 'CPU' if host_device_mix else 'DEVICE' self.wide_embeddinglookup = nn.EmbeddingLookup(config.vocab_size, 1, target=target, slice_mode=nn.EmbeddingLookup.TABLE_ROW_SLICE) if config.deep_table_slice_mode == "column_slice": self.deep_embeddinglookup = nn.EmbeddingLookup(config.vocab_size, self.emb_dim, target=target, slice_mode=nn.EmbeddingLookup.TABLE_COLUMN_SLICE) if config.use_sp: self.dense_layer_1.matmul.shard(((1, get_group_size()), (get_group_size(), 1))) self.dense_layer_1.bias_add.shard(((get_group_size(), 1), (1,))) self.deep_mul.shard(((1, 1, get_group_size()), (1, 1, 1))) else: self.dense_layer_1.dropout.dropout.shard(((1, get_group_size()),)) self.dense_layer_1.matmul.shard(((1, get_group_size()), (get_group_size(), 1))) self.deep_mul.shard(((1, 1, get_group_size()), (1, 1, 1))) self.dense_layer_1.matmul.add_prim_attr("field_size", self.field_size) self.deep_reshape.add_prim_attr("skip_redistribution", True) else: self.deep_embeddinglookup = nn.EmbeddingLookup(config.vocab_size, self.emb_dim, target=target, slice_mode=nn.EmbeddingLookup.TABLE_ROW_SLICE) self.reduce_sum.add_prim_attr("cross_batch", True) self.embedding_table = self.deep_embeddinglookup.embedding_table elif is_auto_parallel and host_device_mix and config.field_slice and config.full_batch and config.manual_shape: manual_shapes = tuple((s[0] for s in config.manual_shape)) self.deep_embeddinglookup = nn.EmbeddingLookup(config.vocab_size, self.emb_dim, slice_mode=nn.EmbeddingLookup.FIELD_SLICE, manual_shapes=manual_shapes) self.wide_embeddinglookup = nn.EmbeddingLookup(config.vocab_size, 1, slice_mode=nn.EmbeddingLookup.FIELD_SLICE, manual_shapes=manual_shapes) self.deep_mul.shard(((1, get_group_size(), 1), (1, get_group_size(), 1))) self.wide_mul.shard(((1, get_group_size(), 
1), (1, get_group_size(), 1))) self.reduce_sum.shard(((1, get_group_size(), 1),)) self.dense_layer_1.dropout.dropout.shard(((1, get_group_size()),)) self.dense_layer_1.matmul.shard(((1, get_group_size()), (get_group_size(), 1))) self.embedding_table = self.deep_embeddinglookup.embedding_table elif parameter_server: cache_enable = config.vocab_cache_size > 0 target = 'DEVICE' if cache_enable else 'CPU' if not cache_enable: sparse = True if is_auto_parallel and config.full_batch and cache_enable: self.deep_embeddinglookup = nn.EmbeddingLookup(config.vocab_size, self.emb_dim, target=target, slice_mode=nn.EmbeddingLookup.TABLE_ROW_SLICE, sparse=sparse, vocab_cache_size=config.vocab_cache_size) self.wide_embeddinglookup = nn.EmbeddingLookup(config.vocab_size, 1, target=target, slice_mode=nn.EmbeddingLookup.TABLE_ROW_SLICE, sparse=sparse, vocab_cache_size=config.vocab_cache_size) else: self.deep_embeddinglookup = nn.EmbeddingLookup(config.vocab_size, self.emb_dim, target=target, sparse=sparse, vocab_cache_size=config.vocab_cache_size) self.wide_embeddinglookup = nn.EmbeddingLookup(config.vocab_size, 1, target=target, sparse=sparse, vocab_cache_size=config.vocab_cache_size) self.embedding_table = self.deep_embeddinglookup.embedding_table self.deep_embeddinglookup.embedding_table.set_param_ps() self.wide_embeddinglookup.embedding_table.set_param_ps() else: self.deep_embeddinglookup = nn.EmbeddingLookup(config.vocab_size, self.emb_dim, target='DEVICE', sparse=sparse, vocab_cache_size=config.vocab_cache_size) self.wide_embeddinglookup = nn.EmbeddingLookup(config.vocab_size, 1, target='DEVICE', sparse=sparse, vocab_cache_size=config.vocab_cache_size) self.embedding_table = self.deep_embeddinglookup.embedding_table def construct(self, id_hldr, wt_hldr): """ Args: id_hldr: batch ids; wt_hldr: batch weights; """ # Wide layer wide_id_weight = self.wide_embeddinglookup(id_hldr) # Deep layer deep_id_embs = self.deep_embeddinglookup(id_hldr) mask = self.reshape(wt_hldr, 
(self.batch_size, self.field_size, 1)) # Wide layer wx = self.wide_mul(wide_id_weight, mask) wide_out = self.reshape(self.reduce_sum(wx, 1) + self.wide_b, (-1, 1)) # Deep layer vx = self.deep_mul(deep_id_embs, mask) deep_in = self.deep_reshape(vx, (-1, self.field_size * self.emb_dim)) deep_in = self.dense_layer_1(deep_in) deep_in = self.dense_layer_2(deep_in) deep_in = self.dense_layer_3(deep_in) deep_in = self.dense_layer_4(deep_in) deep_out = self.dense_layer_5(deep_in) out = wide_out + deep_out return out, self.embedding_table class NetWithLossClass(nn.Cell): """" Provide WideDeep training loss through network. Args: network (Cell): The training network config (Class): WideDeep config """ def init(self, network, config): super(NetWithLossClass, self).init(auto_prefix=False) host_device_mix = bool(config.host_device_mix) parameter_server = bool(config.parameter_server) sparse = config.sparse parallel_mode = context.get_auto_parallel_context("parallel_mode") is_auto_parallel = parallel_mode in (ParallelMode.SEMI_AUTO_PARALLEL, ParallelMode.AUTO_PARALLEL) self.no_l2loss = (is_auto_parallel if (host_device_mix or config.field_slice) else parameter_server) if sparse: self.no_l2loss = True self.network = network self.l2_coef = config.l2_coef self.loss = ops.SigmoidCrossEntropyWithLogits() self.square = ops.Square() self.reduceMean_false = ops.ReduceMean(keep_dims=False) if is_auto_parallel: self.reduceMean_false.add_prim_attr("cross_batch", True) self.reduceSum_false = ops.ReduceSum(keep_dims=False) def construct(self, batch_ids, batch_wts, label): ''' Construct NetWithLossClass ''' predict, embedding_table = self.network(batch_ids, batch_wts) log_loss = self.loss(predict, label) wide_loss = self.reduceMean_false(log_loss) if self.no_l2loss: deep_loss = wide_loss else: l2_loss_v = self.reduceSum_false(self.square(embedding_table)) / 2 deep_loss = self.reduceMean_false(log_loss) + self.l2_coef * l2_loss_v return wide_loss, deep_loss class IthOutputCell(nn.Cell): def 
init(self, network, output_index): super(IthOutputCell, self).init() self.network = network self.output_index = output_index def construct(self, x1, x2, x3): predict = self.network(x1, x2, x3)[self.output_index] return predict class TrainStepWrap(nn.Cell): """ Encapsulation class of WideDeep network training. Append Adam and FTRL optimizers to the training network after that construct function can be called to create the backward graph. Args: network (Cell): The training network. Note that loss function should have been added. sens (Number): The adjust parameter. Default: 1024.0 host_device_mix (Bool): Whether run in host and device mix mode. Default: False parameter_server (Bool): Whether run in parameter server mode. Default: False """ def init(self, network, sens=1024.0, host_device_mix=False, parameter_server=False, sparse=False, cache_enable=False): super(TrainStepWrap, self).init() parallel_mode = context.get_auto_parallel_context("parallel_mode") is_auto_parallel = parallel_mode in (ParallelMode.SEMI_AUTO_PARALLEL, ParallelMode.AUTO_PARALLEL) self.network = network self.network.set_train() self.trainable_params = network.trainable_params() weights_w = [] weights_d = [] for params in self.trainable_params: if 'wide' in params.name: weights_w.append(params) else: weights_d.append(params) self.weights_w = ParameterTuple(weights_w) self.weights_d = ParameterTuple(weights_d) if (sparse and is_auto_parallel) or (sparse and parameter_server): self.optimizer_d = Adam( self.weights_d, learning_rate=5e-4, eps=1e-8, loss_scale=sens, use_lazy=True) self.optimizer_w = FTRL(learning_rate=1e-3, params=self.weights_w, l1=1e-8, l2=1e-8, initial_accum=1.0, loss_scale=sens) if host_device_mix or (parameter_server and not cache_enable): self.optimizer_w.target = "CPU" self.optimizer_d.target = "CPU" else: self.optimizer_d = Adam( self.weights_d, learning_rate=5e-4, eps=1e-8, loss_scale=sens) self.optimizer_w = FTRL(learning_rate=1e-3, params=self.weights_w, l1=1e-8, l2=1e-8, 
initial_accum=1.0, loss_scale=sens) self.hyper_map = ops.HyperMap() self.grad_w = ops.GradOperation(get_by_list=True, sens_param=True) self.grad_d = ops.GradOperation(get_by_list=True, sens_param=True) self.sens = sens self.loss_net_w = IthOutputCell(network, output_index=0) self.loss_net_d = IthOutputCell(network, output_index=1) self.loss_net_w.set_grad() self.loss_net_d.set_grad() self.reducer_flag = False self.grad_reducer_w = None self.grad_reducer_d = None self.reducer_flag = parallel_mode in (ParallelMode.DATA_PARALLEL, ParallelMode.HYBRID_PARALLEL) if self.reducer_flag: mean = context.get_auto_parallel_context("gradients_mean") degree = context.get_auto_parallel_context("device_num") self.grad_reducer_w = DistributedGradReducer(self.optimizer_w.parameters, mean, degree) self.grad_reducer_d = DistributedGradReducer(self.optimizer_d.parameters, mean, degree) def construct(self, batch_ids, batch_wts, label): ''' Construct wide and deep model ''' weights_w = self.weights_w weights_d = self.weights_d loss_w, loss_d = self.network(batch_ids, batch_wts, label) sens_w = ops.Fill()(ops.DType()(loss_w), ops.Shape()(loss_w), self.sens) sens_d = ops.Fill()(ops.DType()(loss_d), ops.Shape()(loss_d), self.sens) grads_w = self.grad_w(self.loss_net_w, weights_w)(batch_ids, batch_wts, label, sens_w) grads_d = self.grad_d(self.loss_net_d, weights_d)(batch_ids, batch_wts, label, sens_d) if self.reducer_flag: grads_w = self.grad_reducer_w(grads_w) grads_d = self.grad_reducer_d(grads_d) return ops.depend(loss_w, self.optimizer_w(grads_w)), ops.depend(loss_d, self.optimizer_d(grads_d)) class PredictWithSigmoid(nn.Cell): """ Predict definition """ def init(self, network): super(PredictWithSigmoid, self).init() self.network = network self.sigmoid = ops.Sigmoid() parallel_mode = context.get_auto_parallel_context("parallel_mode") full_batch = context.get_auto_parallel_context("full_batch") is_auto_parallel = parallel_mode in (ParallelMode.SEMI_AUTO_PARALLEL, 
ParallelMode.AUTO_PARALLEL) if is_auto_parallel and full_batch: self.sigmoid.shard(((1, 1),)) def construct(self, batch_ids, batch_wts, labels): logits, _, = self.network(batch_ids, batch_wts) pred_probs = self.sigmoid(logits) return logits, pred_probs, labels # Pre processing def pre_process_criteo_wide_deep(x): return x class WideDeepPostProcess: def init(self): self.good = 0 self.total = 0 self.roc_auc = 0 self.results = [] self.labels = [] def call(self, results, expected=None, result_dict=None): processed_results = [] n = len(results) for idx in range(0, n): result = results['auc'] processed_results.append(result) self.good += 1 self.total += 1 return processed_results def add_results(self, labels, results): self.results.append(results) self.labels.append(labels) def start(self): self.good = 0 self.total = 0 self.roc_auc = 0 self.results = [] def finalize(self, result_dict, ds=False, output_dir=None): result_dict["good"] = self.good result_dict["total"] = self.total 我在将模型和权重转化成onnx文件时需要将模型代码中的训练部分去除么？

#y仅在训练时传入标签out=self.linear(x)ifyisnotNone:#训练分支returnself.loss_fn(out,y)returnout#推理分支**转换前需修改为**：pythonclassWideDeepModelForExport(nn.Module):def__init__(self,base_...

运行以下Python代码：import torchimport torch.nn as nnimport torch.optim as optimfrom torchvision import datasets, transformsfrom torch.utils.data import DataLoaderfrom torch.autograd import Variableclass Generator(nn.Module): def init(self, input_dim, output_dim, num_filters): super(Generator, self).init() self.input_dim = input_dim self.output_dim = output_dim self.num_filters = num_filters self.net = nn.Sequential( nn.Linear(input_dim, num_filters), nn.ReLU(), nn.Linear(num_filters, num_filters2), nn.ReLU(), nn.Linear(num_filters2, num_filters4), nn.ReLU(), nn.Linear(num_filters4, output_dim), nn.Tanh() ) def forward(self, x): x = self.net(x) return xclass Discriminator(nn.Module): def init(self, input_dim, num_filters): super(Discriminator, self).init() self.input_dim = input_dim self.num_filters = num_filters self.net = nn.Sequential( nn.Linear(input_dim, num_filters4), nn.LeakyReLU(0.2), nn.Linear(num_filters4, num_filters2), nn.LeakyReLU(0.2), nn.Linear(num_filters2, num_filters), nn.LeakyReLU(0.2), nn.Linear(num_filters, 1), nn.Sigmoid() ) def forward(self, x): x = self.net(x) return xclass ConditionalGAN(object): def init(self, input_dim, output_dim, num_filters, learning_rate): self.generator = Generator(input_dim, output_dim, num_filters) self.discriminator = Discriminator(input_dim+1, num_filters) self.optimizer_G = optim.Adam(self.generator.parameters(), lr=learning_rate) self.optimizer_D = optim.Adam(self.discriminator.parameters(), lr=learning_rate) def train(self, data_loader, num_epochs): for epoch in range(num_epochs): for i, (inputs, labels) in enumerate(data_loader): # Train discriminator with real data real_inputs = Variable(inputs) real_labels = Variable(labels) real_labels = real_labels.view(real_labels.size(0), 1) real_inputs = torch.cat((real_inputs, real_labels), 1) real_outputs = self.discriminator(real_inputs) real_loss = nn.BCELoss()(real_outputs, torch.ones(real_outputs.size())) # Train discriminator with fake data noise = 
Variable(torch.randn(inputs.size(0), self.generator.input_dim)) fake_labels = Variable(torch.LongTensor(inputs.size(0)).random_(0, 10)) fake_labels = fake_labels.view(fake_labels.size(0), 1) fake_inputs = self.generator(torch.cat((noise, fake_labels.float()), 1)) fake_inputs = torch.cat((fake_inputs, fake_labels), 1) fake_outputs = self.discriminator(fake_inputs) fake_loss = nn.BCELoss()(fake_outputs, torch.zeros(fake_outputs.size())) # Backpropagate and update weights for discriminator discriminator_loss = real_loss + fake_loss self.discriminator.zero_grad() discriminator_loss.backward() self.optimizer_D.step() # Train generator noise = Variable(torch.randn(inputs.size(0), self.generator.input_dim)) fake_labels = Variable(torch.LongTensor(inputs.size(0)).random_(0,

def __init__(self, input_dim, output_dim, num_filters, learning_rate): self.generator = Generator(input_dim, output_dim, num_filters) self.discriminator = Discriminator(input_dim+1, num_filters) ...

class ASPP(nn.Module):
    """Layers of an atrous spatial pyramid pooling head.

    Builds seven conv-BN-ReLU branches (one 1x1, six dilated 3x3), a separate
    1x1 conv / BN / ReLU triple (``branch8_*``) and a 1x1 ``conv_cat`` that
    takes ``8 * dim_out`` channels. The quoted snippet defines the layers only;
    it contains no ``forward`` method.

    Args:
        dim_in: Input channels of every branch.
        dim_out: Output channels of every branch and of ``conv_cat``.
        rate: Multiplier applied to each branch's dilation and padding.
        bn_mom: Momentum given to every ``nn.BatchNorm2d``.
    """

    def __init__(self, dim_in, dim_out, rate=1, bn_mom=0.1):
        # Must be ``__init__``: spelled ``init`` the layers below are never
        # created when the class is instantiated.
        super().__init__()
        self.branch1 = self._conv_bn_relu(dim_in, dim_out, 1, rate, bn_mom)
        self.branch2 = self._conv_bn_relu(dim_in, dim_out, 3, 4 * rate, bn_mom)
        self.branch3 = self._conv_bn_relu(dim_in, dim_out, 3, 8 * rate, bn_mom)
        self.branch4 = self._conv_bn_relu(dim_in, dim_out, 3, 12 * rate, bn_mom)
        self.branch5 = self._conv_bn_relu(dim_in, dim_out, 3, 16 * rate, bn_mom)
        self.branch6 = self._conv_bn_relu(dim_in, dim_out, 3, 20 * rate, bn_mom)
        self.branch7 = self._conv_bn_relu(dim_in, dim_out, 3, 24 * rate, bn_mom)
        # branch8 is kept as three separate attributes, as in the original.
        self.branch8_conv = nn.Conv2d(dim_in, dim_out, 1, 1, 0, bias=True)
        self.branch8_bn = nn.BatchNorm2d(dim_out, momentum=bn_mom)
        self.branch8_relu = nn.ReLU(inplace=True)
        self.conv_cat = nn.Sequential(
            nn.Conv2d(dim_out * 8, dim_out, 1, 1, padding=0, bias=True),
            nn.BatchNorm2d(dim_out, momentum=bn_mom),
            nn.ReLU(inplace=True),
        )

    @staticmethod
    def _conv_bn_relu(dim_in, dim_out, kernel_size, dilation, bn_mom):
        """Return a stride-1 Conv2d -> BatchNorm2d -> ReLU stack.

        Padding is ``dilation * (kernel_size // 2)``: 0 for the 1x1 branch and
        ``dilation`` for the 3x3 branches, matching the original literals.
        """
        padding = dilation * (kernel_size // 2)
        return nn.Sequential(
            nn.Conv2d(dim_in, dim_out, kernel_size, 1, padding=padding,
                      dilation=dilation, bias=True),
            nn.BatchNorm2d(dim_out, momentum=bn_mom),
            nn.ReLU(inplace=True),
        )


# Request quoted together with this snippet: replace the 3x3 convolutions in
# this code with 1x3 and 3x1 convolutions.

nn.Conv2d(dim_in, dim_out, (1, 3), 1, padding=(0, 4 * rate), dilation=4 * rate, bias=True), nn.Conv2d(dim_out, dim_out, (3, 1), 1, padding=(4 * rate, 0), dilation=4 * rate, bias=True), nn.BatchNorm...

class OrientedASPP(nn.Module):
    """ASPP variant that blends five parallel branches with softmax attention.

    The branches are a 1x1 conv, three dilated 3x3 convs (dilation 6, 12 and
    18 times ``rate``) and a globally average-pooled 1x1 conv. A 1x1 conv
    followed by a channel softmax produces one weight map per branch, and the
    output is the weighted sum of the branch features.

    The original comment calls this a directional filter bank (0, 45, 90,
    135 degrees); in this code the branches differ only by dilation and
    pooling.

    Args:
        dim_in: Input channels.
        dim_out: Output channels of every branch and of the module.
        rate: Multiplier applied to the dilation of every conv branch.
    """

    def __init__(self, dim_in, dim_out, rate=1):
        # Must be ``__init__``: spelled ``init`` no layer is ever registered.
        super().__init__()
        self.conv_arrange = nn.Sequential(
            nn.AdaptiveAvgPool2d((1, 1)),
            nn.Conv2d(dim_in, dim_out, 1, 1, 0, bias=True),
            nn.BatchNorm2d(dim_out),
            nn.ReLU(inplace=True),
        )
        self.branch1 = nn.Sequential(
            nn.Conv2d(dim_in, dim_out, 1, 1, padding=0, dilation=rate, bias=True),
            nn.BatchNorm2d(dim_out),
            nn.ReLU(inplace=True),
        )
        self.branch2 = nn.Sequential(
            nn.Conv2d(dim_in, dim_out, 3, 1, padding=6 * rate, dilation=6 * rate, bias=True),
            nn.BatchNorm2d(dim_out),
            nn.ReLU(inplace=True),
        )
        self.branch3 = nn.Sequential(
            nn.Conv2d(dim_in, dim_out, 3, 1, padding=12 * rate, dilation=12 * rate, bias=True),
            nn.BatchNorm2d(dim_out),
            nn.ReLU(inplace=True),
        )
        self.branch4 = nn.Sequential(
            nn.Conv2d(dim_in, dim_out, 3, 1, padding=18 * rate, dilation=18 * rate, bias=True),
            nn.BatchNorm2d(dim_out),
            nn.ReLU(inplace=True),
        )
        self.convs = nn.ModuleList([
            self.branch1, self.branch2, self.branch3, self.branch4,
            self.conv_arrange,
        ])
        # One attention map per branch, normalised across the branch axis.
        self.orient_att = nn.Sequential(
            nn.Conv2d(5 * dim_out, 5, 1),
            nn.Softmax(dim=1),
        )

    def forward(self, x):
        """Return the attention-weighted sum of the five branch outputs.

        Args:
            x: Input tensor; indexed as (N, C, H, W) by the conv layers.

        Returns:
            Tensor with ``dim_out`` channels and the spatial size of ``x``.
        """
        height, width = x.shape[-2:]
        feats = []
        for conv in self.convs:
            feat = conv(x)
            if feat.shape[-2:] != x.shape[-2:]:
                # The pooled branch is 1x1; broadcast it to HxW so it can be
                # concatenated with, and weighted like, the other branches.
                feat = feat.expand(-1, -1, height, width)
            feats.append(feat)
        fused = torch.cat(feats, dim=1)
        att = self.orient_att(fused)  # [N, 5, H, W]
        return sum(att[:, i:i + 1] * feat for i, feat in enumerate(feats))


# Error reported with the original snippet: "RuntimeError: Sizes of tensors
# must match except in dimension 1. Expected size 288 but got size 1 for tensor
# number 4 in the list." It came from concatenating the 1x1 pooled branch with
# the full-resolution branches; forward() now broadcasts that branch first.

self.conv_arrange = nn.Conv2d(dim_in, dim_out, 1) 4. **推荐实现**：建议采用方案一，修改后的模块结构应为： python self.conv_arrange = nn.Sequential( nn.Conv2d(dim_in, dim_out, 1, 1, 0, bias=...

class OrientedASPP(nn.Module):
    """Dilated 3x3 branches fused by a per-pixel softmax attention.

    One 3x3 conv is built per entry of ``rates`` (padding and dilation both
    equal to the rate, so the spatial size is kept). A 1x1 conv followed by a
    channel softmax yields one weight map per branch, and the output is the
    weighted sum of the branch features.

    The original comment calls this a directional filter bank (0, 45, 90,
    135 degrees); in this code the branches differ only by dilation.

    Args:
        in_ch: Input channels.
        out_ch: Output channels of every branch and of the module.
        rates: Dilation rate of each branch. Any sequence of ints; the
            default is a tuple so no mutable object is shared between calls.
    """

    def __init__(self, in_ch, out_ch, rates=(6, 12, 18)):
        # Must be ``__init__``: spelled ``init`` no layer is ever registered.
        super().__init__()
        self.convs = nn.ModuleList([
            nn.Conv2d(in_ch, out_ch, 3, padding=rate, dilation=rate)
            for rate in rates
        ])
        # The number of attention maps follows the number of branches. The
        # original hard-coded 4 while only len(rates) branches existed.
        self.orient_att = nn.Sequential(
            nn.Conv2d(len(rates) * out_ch, len(rates), 1),
            nn.Softmax(dim=1),
        )

    def forward(self, x):
        """Return the attention-weighted sum of all branch outputs.

        Args:
            x: Input tensor; indexed as (N, C, H, W) by the conv layers.

        Returns:
            Tensor with ``out_ch`` channels and the spatial size of ``x``.
        """
        feats = [conv(x) for conv in self.convs]
        fused = torch.cat(feats, dim=1)
        att = self.orient_att(fused)  # [N, len(rates), H, W]
        # Iterate over the branches that exist instead of a fixed range(4),
        # which indexed past the end of ``feats`` with the default rates.
        return sum(att[:, i:i + 1] * feat for i, feat in enumerate(feats))


# Request quoted together with this snippet: on top of this, add one branch
# that does not use dilated convolution, and an average-pooling branch.

class OrientedASPP(nn.Module): def __init__(self, in_ch, out_ch, rates=[6,12,18]): super().__init__() # 原始膨胀卷积分支（rates=[6,12,18]） self.convs = nn.ModuleList([ nn.Conv2d(in_ch, out_ch, 3...

光储直流微电网的协调控制与直流电压分层优化

内容概要：本文探讨了光储直流微电网的协调控制及其关键技术，重点介绍了直流电压分层优化控制方法和逆变器......

相关推荐

Python RuntimeError: thread.__init__() not called解决方法

bst.rar_bst_bst tree

python基础进阶1.6：面向对象之类，对象及__init__()，self相关用法讲解

class LinearRegressionModel(nn.Module):
    """Linear regression model: one fully connected layer.

    Args:
        input_dim: Number of input features.
        output_dim: Number of output values.
    """

    def __init__(self, input_dim, output_dim):
        # The constructor has to be spelled ``__init__`` (two underscores on
        # each side). Spelled ``_init_`` it is an ordinary method that Python
        # never calls, so ``self.linear`` would not exist when ``forward`` runs.
        super().__init__()
        self.linear = nn.Linear(input_dim, output_dim)

    def forward(self, x):
        """Return the output of the linear layer applied to ``x``."""
        return self.linear(x)

光储直流微电网的协调控制与直流电压分层优化

大家在看

ISO/IEC 27001:2022与ISO 27002:2022最新版中英文版合集

华为模拟器(Enterprise Network Simulator )命令参考手册.zip

dspic最小系统

斯蒂芬-玻尔兹曼定律-红外成像论文资料

删除ip gurad软件，拒绝监管

最新推荐

Info2007v1.0更新至v2.0：优化管理与前台功能

Rust测试实战：错误处理、环境变量与模拟服务器

op-drone:监控未平仓头寸的市场利器

RustWeb服务部署与环境变量配置全解析

消灭病毒 源代码

Apache Directory：Java编写的LDAP v3兼容目录解决方案

Rust项目中用户认证与登录功能的实现与优化

如何使用使用QZipReader解压文件

Rust频谱分析库：利用FFT快速获得音频频谱

Python RuntimeError: thread.__init__() not called解决方法

python基础进阶1.6：面向对象之类，对象及__init__()，self相关用法讲解

消灭病毒源代码