# Source code for UM2N.model.MRN_atten

# Author: Chunyang Wang
# GitHub Username: acse-cw1722

import os
import sys

import torch
import torch.nn as nn
import torch.nn.functional as F
from torch_geometric.nn import GATv2Conv, MessagePassing

cur_dir = os.path.dirname(__file__)
sys.path.append(cur_dir)
from extractor import (  # noqa: E402
    GlobalFeatExtractor,
    LocalFeatExtractor,
)

__all__ = ["MRNAtten"]


class RecurrentGATConv(MessagePassing):
    """
    Implements a Recurrent Graph Attention Network (GAT) Convolution layer.

    One call concatenates the node coordinates with the current hidden state,
    passes them through a GATv2 layer followed by SELU, and maps the new
    hidden state to new coordinates with a linear layer. Nodes whose *input*
    coordinate is exactly 0 or 1 in column 0 or column 1 have that component
    written back onto the output, so such nodes keep that component fixed.

    Attributes:
        to_hidden (GATv2Conv): Graph Attention layer.
        to_coord (nn.Sequential): Output layer for coordinates.
        activation (nn.SELU): Activation function.
        upper_node_idx, down_node_idx, left_node_idx, right_node_idx (Tensor):
            Boolean node masks written by :meth:`find_boundary` on every
            forward call and read by :meth:`fix_boundary`.
    """

    def __init__(self, coord_size=2, hidden_size=512, heads=6, concat=False):
        """
        Args:
            coord_size (int): Number of coordinate channels per node.
            hidden_size (int): Width of the recurrent hidden state.
            heads (int): Number of attention heads passed to ``GATv2Conv``.
            concat (bool): Forwarded to ``GATv2Conv``.
                NOTE(review): ``to_coord`` and the recurrence both expect the
                GAT output to be ``hidden_size`` wide, which presumably only
                holds for ``concat=False`` -- confirm before enabling.
        """
        super().__init__()
        # GAT layer
        self.to_hidden = GATv2Conv(
            in_channels=coord_size + hidden_size,
            out_channels=hidden_size,
            heads=heads,
            concat=concat,
        )
        # Output coord layer. The output width must equal ``coord_size``
        # (it used to be hard-coded to 2) because the returned coordinates
        # are concatenated with the hidden state again on the next recurrent
        # step and must match ``in_channels`` above.
        self.to_coord = nn.Sequential(
            nn.Linear(hidden_size, coord_size),
        )
        # activation function
        self.activation = nn.SELU()

    def forward(self, coord, hidden_state, edge_index):
        """
        Run one recurrent deformation step.

        Args:
            coord (Tensor): Node coordinates; concatenated with
                ``hidden_state`` along dim 1.
            hidden_state (Tensor): Per-node hidden state.
            edge_index (Tensor): Graph connectivity passed to ``GATv2Conv``.

        Returns:
            tuple: ``(output_coord, hidden)`` -- the new coordinates and the
            new hidden state.
        """
        # Remember which nodes sit on a boundary *before* moving them.
        self.find_boundary(coord)
        # Recurrent GAT
        in_feat = torch.cat((coord, hidden_state), dim=1)
        hidden = self.activation(self.to_hidden(in_feat, edge_index))
        output_coord = self.to_coord(hidden)
        # Write the boundary components back (in place).
        self.fix_boundary(output_coord)
        return output_coord, hidden

    def find_boundary(self, in_data):
        """
        Record boolean masks of nodes lying exactly on 0 or 1.

        Column 0 is compared against 1 / 0 for the "upper" / "down" masks and
        column 1 against 0 / 1 for the "left" / "right" masks. The comparison
        is exact floating-point equality. The masks are stored on ``self``.
        """
        first, second = in_data[:, 0], in_data[:, 1]
        self.upper_node_idx = first == 1
        self.down_node_idx = first == 0
        self.left_node_idx = second == 0
        self.right_node_idx = second == 1

    def fix_boundary(self, in_data):
        """
        Overwrite, in place, the boundary components of ``in_data``.

        Uses the masks stored by the most recent :meth:`find_boundary` call,
        so that call must have been made on a tensor with the same number of
        rows.
        """
        in_data[self.upper_node_idx, 0] = 1
        in_data[self.down_node_idx, 0] = 0
        in_data[self.left_node_idx, 1] = 0
        in_data[self.right_node_idx, 1] = 1



# (Sphinx "[docs]" link marker from the rendered page; not part of the module source)
class MRNAtten(torch.nn.Module):
    """
    Mesh Refinement Network (MRN) with self attention.

    Combines global and local feature extraction, one transformer-encoder
    style self-attention block over the nodes of each sample, and recurrent
    graph-based deformations.

    Attributes:
        num_loop (int): Number of loops for the recurrent layer.
        gfe_out_c (int): Output channels for global feature extractor.
        lfe_out_c (int): Output channels for local feature extractor.
        hidden_size (int): Size of the hidden layer.
        all_feat_c (int): Width of the concatenated per-node feature vector
            fed to ``lin``.
        embed_dim (int): Embedding width of the attention block; equal to
            ``hidden_size``.
        num_heads (int): Number of attention heads.
        dense_dim (int): Width of the feed-forward layer in the attention
            block.
        gfe (GlobalFeatExtractor): Global feature extractor.
        lfe (LocalFeatExtractor): Local feature extractor.
        atten (nn.MultiheadAttention): Self-attention layer.
        lin (nn.Linear): Linear layer for feature transformation.
        deformer (RecurrentGATConv): GAT-based deformer block.
    """

    def __init__(self, gfe_in_c=2, lfe_in_c=4, deform_in_c=7, num_loop=3):
        """
        Initialize MRN.

        Args:
            gfe_in_c (int): Input channels for the global feature extractor.
            lfe_in_c (int): Input channels for the local feature extractor.
            deform_in_c (int): Input channels for the deformer block.
            num_loop (int): Number of loops for the recurrent layer.

        Raises:
            ValueError: If ``embed_dim`` is not divisible by ``num_heads``.
        """
        super().__init__()
        self.num_loop = num_loop
        self.gfe_out_c = 16
        self.lfe_out_c = 16
        self.hidden_size = 512  # set here
        # minus 2 because the x, y coords (first 2 channels of ``data.x``)
        # are passed to the deformer directly instead of going through ``lin``
        self.all_feat_c = (deform_in_c - 2) + self.gfe_out_c + self.lfe_out_c

        self.gfe = GlobalFeatExtractor(in_c=gfe_in_c, out_c=self.gfe_out_c)
        self.lfe = LocalFeatExtractor(num_feat=lfe_in_c, out=self.lfe_out_c)

        # =======================================================
        # Define the self attention layer
        # Attention is applied directly to the hidden state, so the embedding
        # width has to be the hidden width.
        self.embed_dim = self.hidden_size
        self.num_heads = 1
        self.dense_dim = 512
        if self.embed_dim % self.num_heads != 0:
            raise ValueError("embed_dim must be divisible by num_heads")
        self.atten = nn.MultiheadAttention(
            embed_dim=self.embed_dim,
            dropout=0.1,
            num_heads=self.num_heads,
            batch_first=True,
        )
        self.pre_attn_norm = nn.LayerNorm(self.embed_dim)
        self.post_attn_norm = nn.LayerNorm(self.embed_dim)
        self.post_attn_dropout = nn.Dropout(0.1)
        self.act_dropout = nn.Dropout(0.1)
        self.dense_1 = nn.Linear(self.embed_dim, self.dense_dim)
        self.dense_2 = nn.Linear(self.dense_dim, self.embed_dim)
        self.pre_dense_norm = nn.LayerNorm(self.embed_dim)
        self.post_dense_norm = nn.LayerNorm(self.dense_dim)
        self.activation = nn.GELU()
        # =======================================================

        # use a linear layer to transform the input feature to hidden
        # state size
        self.lin = nn.Linear(self.all_feat_c, self.hidden_size)
        self.deformer = RecurrentGATConv(
            coord_size=2, hidden_size=self.hidden_size, heads=6, concat=False
        )

    def _initial_hidden(self, data):
        """Build the flat per-node hidden state from global, local and node features."""
        # Global features are computed once per sample and then repeated for
        # every node of that sample.
        conv_feat = self.gfe(data.conv_feat)
        conv_feat = conv_feat.repeat_interleave(data.node_num.reshape(-1), dim=0)

        local_feat = self.lfe(data.mesh_feat, data.edge_index)

        # data.x[:, :2] (the coordinates) is deliberately left out here.
        hidden_in = torch.cat([data.x[:, 2:], local_feat, conv_feat], dim=1)
        return F.selu(self.lin(hidden_in))

    def _attention_block(self, hidden):
        """Apply the transformer encoder block to ``[batch, nodes, feat]`` input."""
        # --- self-attention sub-layer with residual connection ---
        residual = hidden
        hidden = self.pre_attn_norm(hidden)
        hidden, _ = self.atten(hidden, hidden, hidden)  # weights are unused
        hidden = self.post_attn_norm(hidden)  # TODO: This seems to be optional
        hidden = self.post_attn_dropout(hidden)
        hidden = hidden + residual

        # --- feed-forward sub-layer with residual connection ---
        residual = hidden
        hidden = self.pre_dense_norm(hidden)
        hidden = self.activation(self.dense_1(hidden))
        hidden = self.act_dropout(hidden)
        hidden = self.post_dense_norm(hidden)  # TODO: This seems to be optional
        hidden = self.dense_2(hidden)
        # The same dropout module as after attention is reused here.
        hidden = self.post_attn_dropout(hidden)
        return hidden + residual

    def _deform(self, data, num_step):
        """Shared implementation of :meth:`move` and :meth:`forward`."""
        coord = data.x[:, :2]
        batch_size = data.conv_feat.shape[0]

        hidden = self._initial_hidden(data)

        # Reshape to [batch size, node num, feature dim] for the transformer.
        # NOTE(review): splitting the flat node axis evenly by batch_size
        # assumes every sample in the batch has the same number of nodes --
        # confirm against the data loader.
        hidden = hidden.reshape(batch_size, -1, hidden.shape[-1])
        hidden = self._attention_block(hidden)
        # Back to [batch size * node num, feature dim] for pyG
        hidden = hidden.flatten(0, 1)

        # Recurrent GAT deform
        for _ in range(num_step):
            coord, hidden = self.deformer(coord, hidden, data.edge_index)

        return coord

    def move(self, data, num_step=1):
        """
        Move the mesh according to the deformation learned, with given number
            steps.

        Args:
            data (Data): Input data object containing mesh and feature info.
                The attributes read are ``x``, ``conv_feat``, ``mesh_feat``,
                ``edge_index`` and ``node_num``.
            num_step (int): Number of deformation steps.

        Returns:
            coord (Tensor): Deformed coordinates.
        """
        return self._deform(data, num_step)

    def forward(self, data):
        """
        Forward pass for MRN; deforms the mesh with ``self.num_loop`` steps.

        Args:
            data (Data): Input data object containing mesh and feature info.
                The attributes read are ``x``, ``conv_feat``, ``mesh_feat``,
                ``edge_index`` and ``node_num``.

        Returns:
            coord (Tensor): Deformed coordinates.
        """
        return self._deform(data, self.num_loop)