单通道合并为三通道输入resnet网络

我们在做多序列任务时，一个患者会有多个序列的图像，每个序列的图像都是1通道的灰度图像，我们可以把一个患者的多有序列合并为多通道输入网络，这里举个3序列的例子。

1.输入之前合并

在输入之前将三张1通道合并为3通道图像，然后设置了参数chunk为3，意思就是将输入的通道拆分为3份，每一份进行网络中卷积后，再将三个卷积后的特征进行拼接。有点类似D-W卷积。

import torch
import torch.nn as nn
import torchvision.models as models


class CustomResNet50(nn.Module):
    def __init__(self,  in_channels=1,num_classes=2, chunk=3):
        super(CustomResNet50, self).__init__()
        self.chunk = chunk
        # 加载预训练的ResNet-50模型
        resnet = models.resnet50(pretrained=True)

        # 将修改后的模型赋值给自定义的ResNet-50网络
        self.model = resnet

        # 修改第一个卷积层的输入通道数
        self.model.conv1 = nn.Conv2d(in_channels, 64, kernel_size=7, stride=2, padding=3, bias=False)

        # 修改全连接层的输出特征数
        self.fc = nn.Linear(2048 * self.chunk, num_classes)


    def  cat(self,x):
        x = self.model.conv1(x)
        x = self.model.bn1(x)
        x = self.model.relu(x)
        x = self.model.maxpool(x)

        x = self.model.layer1(x)
        x = self.model.layer2(x)
        x = self.model.layer3(x)
        x = self.model.layer4(x)
        x = self.model.avgpool(x)
        x = torch.flatten(x, 1)
        return x


    def forward(self, x ):
        # 对输入的三通道图像进行分割
        self.data = []
        split_data = torch.split(x, 1, dim=1)
        for i in range(self.chunk):
            self.data.append(self.cat(split_data[i]))

        # 在全连接层之前进行拼接
        x = torch.cat(self.data, dim=1)


        # 全连接层输出
        output = self.fc(x)

        return output

if __name__ == '__main__':
    # 创建一个实例，并指定类别数
    net = CustomResNet50( in_channels=1,num_classes=2,chunk=3)

    # 输出网络结构
    print(net)
#
#
#
#     # 在输入数据上进行前向传播
#     input_data = torch.randn(64, 3, 224, 224)  # 假设输入数据尺寸为1x224x224
#     output = net(input_data)
#     print("前连接层特征尺寸:", output.size())

2.在输入网络中合并

输入的是一个字典，将三个序列的数据保存在字典中，从字典中读取每个序列的数据，然后进行网络卷积，三个序列卷积之后，再进行合并。这里的chunk主要是调整合并后的特征数，经线性层到分类数。并没有起到拆分的作用。

import torch
import torch.nn as nn
import torchvision.models as models


class CustomResNet50(nn.Module):
    def __init__(self,  in_channels=1,num_classes=2, chunk=3):
        super(CustomResNet50, self).__init__()
        self.chunk = chunk
        # 加载预训练的ResNet-50模型
        resnet = models.resnet50(pretrained=True)

        # 将修改后的模型赋值给自定义的ResNet-50网络
        self.model = resnet

        # 修改第一个卷积层的输入通道数
        self.model.conv1 = nn.Conv2d(in_channels, 64, kernel_size=7, stride=2, padding=3, bias=False)

        # 修改全连接层的输出特征数
        self.fc = nn.Linear(2048 * self.chunk, num_classes)


    def  cat(self,x):
        x = self.model.conv1(x)
        x = self.model.bn1(x)
        x = self.model.relu(x)
        x = self.model.maxpool(x)

        x = self.model.layer1(x)
        x = self.model.layer2(x)
        x = self.model.layer3(x)
        x = self.model.layer4(x)
        x = self.model.avgpool(x)
        x = torch.flatten(x, 1)
        return x


    def forward(self, x ):

        low_energy = x['LOW_ENERGY']
        high_energy = x['HIGH_ENERGY']
        enhance = x['ENHANCE']

        low_energy = self.cat(low_energy)
        high_energy = self.cat(high_energy)
        enhance = self.cat(enhance)
        # # 对输入的三通道图像进行分割
        # self.data = []
        # split_data = torch.split(x, 1, dim=1)
        # for i in range(self.chunk):
        #     self.data.append(self.cat(split_data[i]))

        # 在全连接层之前进行拼接
        x = torch.cat((low_energy,high_energy,enhance), dim=1)

        # 全连接层输出
        output = self.fc(x)

        return output

if __name__ == '__main__':
    # 创建一个实例，并指定类别数
    net = CustomResNet50( in_channels=1,num_classes=2,chunk=3)

    # 输出网络结构
    # print(net)


    #
    # # 在输入数据上进行前向传播
    # input_data = torch.randn(64, 3, 224, 224)  # 假设输入数据尺寸为1x224x224
    # output = net(input_data)
    # print("前连接层特征尺寸:", output.size())

    input_data = {'LOW_ENERGY':torch.randn(64,1, 224, 224) ,
                  'HIGH_ENERGY': torch.randn(64,1, 224, 224),
                  'ENHANCE': torch.randn(64,1, 224, 224),
                  } # 假设输入数据尺寸为1x224x224
    output = net(input_data)
    print("前连接层特征尺寸:", output.size())

本文来自互联网用户投稿，该文观点仅代表作者本人，不代表本站立场。本站仅提供信息存储空间服务，不拥有所有权，不承担相关法律责任。如若转载，请注明出处：http://www.mfbz.cn/a/595573.html

如若内容造成侵权/违法违规/事实不符，请联系我们进行投诉反馈qq邮箱809451989@qq.com，一经查实，立即删除！