U-net

最新推荐文章于 2024-05-07 19:50:07 发布

wzy_barry

最新推荐文章于 2024-05-07 19:50:07 发布

阅读量171

点赞数

分类专栏：机器学习文章标签：深度学习人工智能 python

本文链接：https://blog.youkuaiyun.com/weixin_45598684/article/details/130622084

版权

机器学习专栏收录该内容

4 篇文章

订阅专栏

该代码实现了一个基于PyTorch的U-net模型，用于图像分割任务。模型包括InConv（输入卷积）、Down（下采样层，含最大池化和双卷积）、Up（上采样层，含转置卷积或双线性插值）和OutConv（输出层）。通过双卷积层进行特征提取，结合上采样和下采样的结构，以处理不同尺度的信息。

摘要生成于 C知道，由 DeepSeek-R1 满血版支持，前往体验 >

import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.nn.init as init


class DoubleConv(nn.Module):
    """(convolution => [BN] => ReLU ) * 2"""
    
    def __init__(self, in_channels, out_channels, mid_channels=None):
        super().__init__()
        # 如果未指定中间通道数，就将其设为输出通道数
        if not mid_channels:
            mid_channels = out_channels
        # 定义双卷积层
        self.double_conv = nn.Sequential(
            nn.Conv2d(in_channels, mid_channels, kernel_size=3, padding=1),
            nn.BatchNorm2d(mid_channels),
            nn.ReLU(inplace=True),
            nn.Conv2d(mid_channels, out_channels, kernel_size=3, padding=1),
            nn.BatchNorm2d(out_channels),
            nn.ReLU(inplace=True)
        )
    
    def forward(self, x):
        return self.double_conv(x)


class Down(nn.Module):
    """Downscaling with maxpool then double conv"""
    
    def __init__(self, in_channels, out_channels):
        super().__init__()
        # 定义一个包含最大池化层和双卷积层的Sequential模块
        self.maxpool_conv = nn.Sequential(
            # 步长默认为2，和kernel_size
            nn.MaxPool2d(2),  # 最大池化层，核大小为2  B*C*H*W => B*C*H/2*W/2，将尺寸分别减半了，但是通道数不变
            DoubleConv(in_channels, out_channels)
        )
    
    def forward(self, x):
        return self.maxpool_conv(x)

class up(nn.Module):
    """
    up path
    conv_transpose => double_conv
    """
    def __init__(self, in_ch, out_ch, Transpose=False):
        super(up, self).__init__()
    
        # would be a nice idea if the upsampling could be learned too,
        # but my machine do not have enough memory to handle all those weights    
        if Transpose:
            self.up = nn.ConvTranspose2d(in_ch, in_ch//2, 2, stride=2)   # 转置卷积，步长为2，kernel为2
        else:
            self.up = nn.Sequential(
                nn.Upsample(scale_factor=2, mode='bilinear',align_corners=True),  # 双线性插值1上采样，比例为2
                nn.Conv2d(in_ch, in_ch//2, kernel_size=1, padding=0),             # 1 * 1 卷积，减少通道数
                nn.ReLU(inplace=True)
                )
        self.conv = DoubleConv(in_ch, out_ch)
        self.up.apply(self.init_weights)   # 初始化权重
    
    def forward(self, x1, x2):
        x1 = self.up(x1)  # 上采样
        
        diffY = x2.size()[2] - x1.size()[2]  # 计算 x2 和 x1 的高度差
        diffX = x2.size()[3] - x1.size()[3]  # 计算 x2 和 x1 的宽度差
        
        # 对 x1 进行补零
        x1 = nn.functional.pad(x1, (diffX // 2, diffX - diffX//2,
                                    diffY // 2, diffY - diffY//2))
        x = torch.cat([x2, x1], dim=1)   # skip connection
        x = self.conv(x)
        return x
    
    @staticmethod
    def init_weights(m):
        if type(m) == nn.Conv2d:
            init.xavier_normal_(m.weight)  # Xavier初始化
            init.constant_(m.bias, 0)      # 常数初始化，设置为0
          

class OutConv(nn.Module):
    '''U-net最后的输出层'''
    def __init__(self, in_channels, out_channels):
        super(OutConv, self).__init__()
        self.conv = nn.Conv2d(in_channels, out_channels, kernel_size=3, padding=1)  # 定义一个1 * 1卷积层，将输入的特征图映射为输出的特征图
    
    def forward(self, x):
        return self.conv(x)

class InConv(nn.Module):
    def __init__(self, in_channels, out_channels):
        super(InConv, self).__init__()
        self.conv = nn.Conv2d(in_channels, out_channels, kernel_size=3, padding=1)
    
    def forward(self, x):
        return self.conv(x)
  

class Unet(nn.Module):
    def __init__(self, in_ch, out_ch=1):
        super(Unet, self).__init__()
        self.loss_stack = 0
        self.matrix_iou_stack = 0
        self.stack_count = 0
        self.display_names = ['loss_stack', 'matrix_iou_stack']
        self.bce_loss = nn.BCELoss()
        self.device = torch.device('cuda' if torch.cuda.is_available() else 'cpu') 
        self.inc = InConv(in_ch, 64)  # 输入卷积层
        self.down1 = Down(64, 128)    # 下采样层 1
        self.down2 = Down(128, 256)   # 下采样层 2
        self.down3 = Down(256, 512)   
        self.drop3 = nn.Dropout2d(0.5)
        self.down4 = Down(512, 1024)
        self.drop4 = nn.Dropout2d(0.5)
        self.up1 = up(1024, 512, False)
        self.up2 = up(512, 256, False)
        self.up3 = up(256, 128, False)
        self.up4 = up(128, 64, False)
        self.outc = OutConv(64, out_ch)
        self.optimizer = torch.optim.Adam(self.parameters(), lr=1e-4)  # 定义优化器
        
    def forward(self, x):
        x1 = self.inc(x)
        x2 = self.down1(x1)
        x3 = self.down2(x2)
        x4 = self.down3(x3)
        x4 = self.drop3(x4)
        x5 = self.down4(x4)
        x5 = self.drop4(x5)
        # 下采样结束，开始上采样
        x = self.up1(x5, x4)
        x = self.up2(x, x3)
        x = self.up3(x, x2)
        x = self.up4(x, x1)
        x = self.outc(x)
        self.pred_y = torch.sigmoid(x)
        return self.pred_y