Using nn.Conv Convolutions in ResidualConvBlock

mikesol · May 23, 2024, 3:45am

In the Diffusion course, they use the ResidualConvBlock pasted below. In the forward pass, there’s a 1x1 nn.Conv2d created at every iteration. Before reading this code, I’d only ever seen layers defined in __init__ and then used in forward. Could someone please help me understand when & why a 1x1 convolution would be defined in the forward pass? Thank you

class ResidualConvBlock(nn.Module):
    def __init__(
        self, in_channels: int, out_channels: int, is_res: bool = False
    ) -> None:
        super().__init__()

        # Check if input and output channels are the same for the residual connection
        self.same_channels = in_channels == out_channels

        # Flag for whether or not to use residual connection
        self.is_res = is_res

        # First convolutional layer
        self.conv1 = nn.Sequential(
            nn.Conv2d(in_channels, out_channels, 3, 1, 1),   # 3x3 kernel with stride 1 and padding 1
            nn.BatchNorm2d(out_channels),   # Batch normalization
            nn.GELU(),   # GELU activation function
        )

        # Second convolutional layer
        self.conv2 = nn.Sequential(
            nn.Conv2d(out_channels, out_channels, 3, 1, 1),   # 3x3 kernel with stride 1 and padding 1
            nn.BatchNorm2d(out_channels),   # Batch normalization
            nn.GELU(),   # GELU activation function
        )

    def forward(self, x: torch.Tensor) -> torch.Tensor:

        # If using residual connection
        if self.is_res:
            # Apply first convolutional layer
            x1 = self.conv1(x)

            # Apply second convolutional layer
            x2 = self.conv2(x1)

            # If input and output channels are the same, add residual connection directly
            if self.same_channels:
                out = x + x2
            else:
                # If not, apply a 1x1 convolutional layer to match dimensions before adding residual connection
                shortcut = nn.Conv2d(x.shape[1], x2.shape[1], kernel_size=1, stride=1, padding=0).to(x.device)
                out = shortcut(x) + x2
            #print(f"resconv forward: x {x.shape}, x1 {x1.shape}, x2 {x2.shape}, out {out.shape}")

            # Normalize output tensor
            return out / 1.414

        # If not using residual connection, return output of second convolutional layer
        else:
            x1 = self.conv1(x)
            x2 = self.conv2(x1)
            return x2

    # Method to get the number of output channels for this block
    def get_out_channels(self):
        return self.conv2[0].out_channels

    # Method to set the number of output channels for this block
    def set_out_channels(self, out_channels):
        self.conv1[0].out_channels = out_channels
        self.conv2[0].in_channels = out_channels
        self.conv2[0].out_channels = out_channels

Topic		Replies	Views
Convolutional Neural Networks - Forward Pass Convolutional Neural Networks coursera-platform	7	611	March 24, 2022
C4 W1 CNN Forward Pass : conv_forward (Dimensions) Convolutional Neural Networks coursera-platform	11	1051	August 13, 2021
Course 4, Week 1 - conv_forward Convolutional Neural Networks coursera-platform	1	666	August 14, 2021
Residual layers explained Convolutional Neural Networks coursera-platform	2	545	May 8, 2023
Residual Nets Question Custom Models, Layers and Loss Functions with TF week-4	6	635	November 15, 2023

Using nn.Conv Convolutions in ResidualConvBlock

Related topics