Source code for ADFWI.dip.model.Unet

import torch
import torch.nn as nn
import torch.nn.functional as F
from FyeldGenerator import generate_field
import numpy as np

# Helper that generates a power-law power spectrum function
def Pkgen(n):
    """ Generates a power spectrum function with a given power-law exponent. """
    def Pk(k):
        return np.power(k, -n)
    return Pk
# Draw complex-valued samples from a normal distribution
def distrib(shape):
    """ Generates complex random samples from a normal distribution. """
    a = np.random.normal(loc=0, scale=1, size=shape)
    b = np.random.normal(loc=0, scale=1, size=shape)
    return a + 1j * b
def generate_grf(shape, alpha, unit_length=10, device='cpu'):
    """ Generates a Gaussian random field using the provided parameters. """
    field = generate_field(distrib, Pkgen(alpha), shape, unit_length=unit_length)
    return torch.tensor(field, dtype=torch.float32, device=device)
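# Illustrative usage sketch (not part of the original module): draw a single
# Gaussian random field on a 100 x 200 grid with a k^-3 power spectrum. The
# grid shape and the alpha value are arbitrary choices made only for demonstration.
def _example_generate_grf():
    latent = generate_grf((100, 200), alpha=3.0, unit_length=10, device='cpu')
    return latent  # torch.Tensor of shape (100, 200), dtype float32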
# Double convolution block
class DoubleConv(nn.Module):
    """ A module that applies two consecutive convolutions, each followed by
    batch normalization and a LeakyReLU activation. """

    def __init__(self, in_channels, out_channels, mid_channels=None):
        super(DoubleConv, self).__init__()
        if not mid_channels:
            mid_channels = out_channels
        self.double_conv = nn.Sequential(
            nn.Conv2d(in_channels, mid_channels, kernel_size=3, padding=1, bias=False),
            nn.BatchNorm2d(mid_channels),
            nn.LeakyReLU(0.1),
            nn.Conv2d(mid_channels, out_channels, kernel_size=3, padding=1, bias=False),
            nn.BatchNorm2d(out_channels),
            nn.LeakyReLU(0.1)
        )
    def forward(self, x):
        """ Forward pass of the DoubleConv block. """
        return self.double_conv(x)
# Downscaling block
class Down(nn.Module):
    """ A downscaling block that applies a convolution followed by max pooling. """

    def __init__(self, in_channels, out_channels):
        super(Down, self).__init__()
        self.maxpool_conv = nn.Sequential(
            DoubleConv(in_channels, out_channels),
            nn.MaxPool2d(2),
        )
    def forward(self, x):
        """ Forward pass of the Down block. """
        return self.maxpool_conv(x)
# Upscaling block
class Up(nn.Module):
    """ An upscaling block that applies either bilinear upsampling or transposed
    convolution, followed by a convolution. """

    def __init__(self, in_channels, out_channels, bilinear=True):
        super(Up, self).__init__()
        if bilinear:
            self.up = nn.Upsample(scale_factor=2, mode='bilinear', align_corners=True)
            self.conv = DoubleConv(in_channels, out_channels, in_channels // 2)
        else:
            self.up = nn.ConvTranspose2d(in_channels, in_channels // 2, kernel_size=2, stride=2)
            self.conv = DoubleConv(in_channels, out_channels)
    def forward(self, x1, x2):
        """ Forward pass of the Up block. """
        x1 = self.up(x1)
        # Pad the upsampled features so they match the spatial size of the skip connection
        diffY = x2.size()[2] - x1.size()[2]
        diffX = x2.size()[3] - x1.size()[3]
        x1 = F.pad(x1, [diffX // 2, diffX - diffX // 2,
                        diffY // 2, diffY - diffY // 2])
        x = torch.cat([x2, x1], dim=1)
        return self.conv(x)
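# Illustrative sketch (not part of the original module): the padding in
# Up.forward keeps the concatenation valid even when the encoder produced an
# odd-sized feature map, e.g. a 7x9 skip connection against a 6x8 upsampled map.
# All tensor sizes and channel counts below are arbitrary demonstration values.
def _example_up_padding():
    up = Up(in_channels=8, out_channels=4, bilinear=False)
    x1 = torch.randn(1, 8, 3, 4)   # coarse features; transposed conv gives 6x8
    x2 = torch.randn(1, 4, 7, 9)   # skip connection with odd spatial size
    out = up(x1, x2)
    return out.shape               # torch.Size([1, 4, 7, 9])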
# Output layer
class OutConv(nn.Module):
    """ The output convolution layer that applies a 1x1 convolution to the input tensor. """

    def __init__(self, in_channels, out_channels):
        super(OutConv, self).__init__()
        self.conv = nn.Conv2d(in_channels, out_channels, kernel_size=1)
    def forward(self, x):
        """ Forward pass of the output convolution layer. """
        return self.conv(x)
# General UNet class for any number of layers
class UNet(nn.Module):
    """ A flexible UNet model that can be configured with different numbers of
    layers and channels.

    Parameters
    ----------
    model_shape : tuple
        The shape of the input model (height, width).
    n_layers : int
        The number of layers in the encoder-decoder network.
    base_channel : int
        The base number of channels at the input.
    vmin : float, optional
        The minimum value for the output, used for rescaling, default is None.
    vmax : float, optional
        The maximum value for the output, used for rescaling, default is None.
    in_channels : int, optional
        The number of input channels, default is 1.
    out_channels : int, optional
        The number of output channels, default is 1.
    bilinear : bool, optional
        Whether to use bilinear upsampling instead of transposed convolution, default is False.
    grf_initialize : bool, optional
        Whether to initialize the model with a Gaussian random field, default is False.
    grf_alpha : float, optional
        The power-law exponent for the Gaussian random field initialization, default is 0.
    unit : int, optional
        A scaling factor for the output, default is 1000.
    device : str, optional
        The device for tensor computations, default is 'cpu'.
    """

    def __init__(self, model_shape, n_layers, base_channel,
                 vmin=None, vmax=None,
                 in_channels=1, out_channels=1,
                 bilinear=False,
                 grf_initialize=False,
                 grf_alpha=0,  # power-law power spectrum
                 unit=1000,
                 device="cpu"):
        super(UNet, self).__init__()
        self.in_channels = in_channels
        self.out_channels = out_channels
        self.model_shape = model_shape
        self.bilinear = bilinear
        self.unit = unit
        self.grf_initialize = grf_initialize
        self.grf_alpha = grf_alpha

        self.inc = DoubleConv(in_channels, base_channel)
        self.downs = nn.ModuleList()
        self.ups = nn.ModuleList()

        # Create down blocks
        channels = base_channel
        for _ in range(n_layers):
            self.downs.append(Down(channels, channels * 2))
            channels *= 2

        # Create up blocks
        factor = 2 if bilinear else 1
        for _ in range(n_layers):
            self.ups.append(Up(channels, channels // 2 // factor, bilinear))
            channels //= 2

        self.outc = OutConv(channels, out_channels)

        # Random latent variable for input
        self.device = device
        self.vmin = vmin
        self.vmax = vmax
        self.h0, self.w0 = model_shape
        if grf_initialize:
            self.random_latent_vector = self._grf_initialize()
        else:
            self.random_latent_vector = self._random_initialize()

    def _random_initialize(self):
        """ Initializes the random latent vector using uniform random values.

        Returns
        -------
        torch.Tensor
            The initialized random latent vector.
        """
        torch.manual_seed(1234)
        return torch.rand(1, 1, self.h0, self.w0).to(self.device)

    def _grf_initialize(self):
        """ Initializes the random latent vector using a Gaussian random field.

        Returns
        -------
        torch.Tensor
            The initialized random latent vector.
        """
        return generate_grf(self.model_shape, self.grf_alpha,
                            device=self.device).unsqueeze(0).unsqueeze(0)
    def forward(self):
        """ Forward pass of the UNet model.

        Returns
        -------
        torch.Tensor
            The output tensor after processing through the UNet.
        """
        x = self.random_latent_vector
        x1 = self.inc(x)

        # Encoder: collect feature maps for the skip connections
        downs_outputs = [x1]
        for down in self.downs:
            downs_outputs.append(down(downs_outputs[-1]))

        # Decoder: combine upsampled features with the corresponding skips
        x = downs_outputs[-1]
        for i in range(len(self.ups)):
            x = self.ups[i](x, downs_outputs[-2 - i])

        out = self.outc(x)
        out = torch.squeeze(out)

        # Optionally rescale the output into [vmin, vmax] via tanh, then apply the unit factor
        if self.vmin is not None and self.vmax is not None:
            out = ((self.vmax - self.vmin) * torch.tanh(out) + (self.vmax + self.vmin)) / 2
        out = torch.squeeze(out) * self.unit
        return out
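# Illustrative usage sketch (not part of the original module): build a UNet that
# reparameterizes a 100 x 200 velocity model bounded between 1.5 and 5.0 km/s
# (scaled to m/s by unit=1000). All argument values here are assumptions chosen
# only for demonstration.
if __name__ == "__main__":
    net = UNet(model_shape=(100, 200),
               n_layers=3,
               base_channel=16,
               vmin=1.5, vmax=5.0,
               in_channels=1, out_channels=1,
               bilinear=False,
               grf_initialize=False,
               unit=1000,
               device="cpu")
    velocity = net()       # forward pass uses the stored random latent vector
    print(velocity.shape)  # torch.Size([100, 200])
    print(velocity.min().item(), velocity.max().item())  # values lie within (1500, 5000)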