# Author: Chunyang Wang
# GitHub Username: acse-cw1722
import os
import sys
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch_geometric.nn import GATv2Conv, MessagePassing
cur_dir = os.path.dirname(__file__)
sys.path.append(cur_dir)
from extractor import ( # noqa: E402
GlobalFeatExtractor,
LocalFeatExtractor,
)
__all__ = ["MRNAtten"]
class RecurrentGATConv(MessagePassing):
    """
    Implements a Recurrent Graph Attention Network (GAT) Convolution layer.

    One call concatenates the current node coordinates with the hidden state,
    passes the result through a GATv2 layer to obtain a new hidden state, and
    maps that hidden state to new coordinates. Nodes whose *input* coordinate
    is exactly 0 or 1 in column 0 or column 1 have that column reset to the
    same value in the output, so they cannot move off that line.

    Attributes:
        to_hidden (GATv2Conv): Graph Attention layer.
        to_coord (nn.Sequential): Output layer for coordinates.
        activation (nn.SELU): Activation function.
    """

    def __init__(self, coord_size=2, hidden_size=512, heads=6, concat=False):
        """
        Build the recurrent GAT cell.

        Args:
            coord_size (int): Number of coordinate channels per node.
            hidden_size (int): Number of hidden-state channels per node.
            heads (int): Number of attention heads, forwarded to GATv2Conv.
            concat (bool): Forwarded to GATv2Conv.
        """
        super().__init__()
        # NOTE(review): with concat=True GATv2Conv emits heads * hidden_size
        # channels, which neither `to_coord` nor the next recurrent step
        # expects -- confirm only concat=False is ever used.
        self.to_hidden = GATv2Conv(
            in_channels=coord_size + hidden_size,
            out_channels=hidden_size,
            heads=heads,
            concat=concat,
        )
        # The predicted coordinates are fed back in as `coord` on the next
        # step, so the output width must equal `coord_size` (this was a
        # hard-coded 2, which only worked for the default).
        self.to_coord = nn.Sequential(
            nn.Linear(hidden_size, coord_size),
        )
        self.activation = nn.SELU()

    def forward(self, coord, hidden_state, edge_index):
        """
        Run one recurrent deformation step.

        Args:
            coord (Tensor): Node coordinates; columns 0 and 1 are inspected
                for boundary values.
            hidden_state (Tensor): Per-node hidden state, concatenated with
                `coord` along dim 1.
            edge_index (Tensor): Graph connectivity passed to the GAT layer.

        Returns:
            tuple: `(output_coord, hidden)` -- the new coordinates (with
            boundary columns reset) and the new hidden state.
        """
        # Remember which nodes sit on a boundary *before* they are moved.
        self.find_boundary(coord)

        gat_input = torch.cat((coord, hidden_state), dim=1)
        hidden = self.activation(self.to_hidden(gat_input, edge_index))
        output_coord = self.to_coord(hidden)

        # Overwrites the boundary columns of `output_coord` in place.
        self.fix_boundary(output_coord)
        return output_coord, hidden

    def find_boundary(self, in_data):
        """
        Record boolean masks of nodes lying on coordinate value 0 or 1.

        The masks are stored on the instance (`upper_node_idx`,
        `down_node_idx`, `left_node_idx`, `right_node_idx`) for a subsequent
        call to `fix_boundary`. The comparison is exact equality.

        Args:
            in_data (Tensor): Node coordinates with at least two columns.
        """
        first_col = in_data[:, 0]
        second_col = in_data[:, 1]
        self.upper_node_idx = first_col == 1
        self.down_node_idx = first_col == 0
        self.left_node_idx = second_col == 0
        self.right_node_idx = second_col == 1

    def fix_boundary(self, in_data):
        """
        Reset boundary columns of `in_data` in place.

        Uses the masks stored by the most recent `find_boundary` call, so
        that call must have happened first. Returns nothing.

        Args:
            in_data (Tensor): Node coordinates to modify in place.
        """
        in_data[self.upper_node_idx, 0] = 1
        in_data[self.down_node_idx, 0] = 0
        in_data[self.left_node_idx, 1] = 0
        in_data[self.right_node_idx, 1] = 1
class MRNAtten(torch.nn.Module):
    """
    Mesh Refinement Network (MRN) with self attention implementing global and
    local feature extraction and recurrent graph-based deformations.

    Attributes:
        num_loop (int): Number of loops for the recurrent layer.
        gfe_out_c (int): Output channels for global feature extractor.
        lfe_out_c (int): Output channels for local feature extractor.
        hidden_size (int): Size of the hidden layer.
        gfe (GlobalFeatExtractor): Global feature extractor.
        lfe (LocalFeatExtractor): Local feature extractor.
        lin (nn.Linear): Linear layer for feature transformation.
        deformer (RecurrentGATConv): GAT-based deformer block.
    """

    def __init__(self, gfe_in_c=2, lfe_in_c=4, deform_in_c=7, num_loop=3):
        """
        Initialize MRN.

        Args:
            gfe_in_c (int): Input channels for the global feature extractor.
            lfe_in_c (int): Input channels for the local feature extractor.
            deform_in_c (int): Input channels for the deformer block.
            num_loop (int): Number of loops for the recurrent layer.
        """
        super().__init__()
        self.num_loop = num_loop
        self.gfe_out_c = 16
        self.lfe_out_c = 16
        self.hidden_size = 512
        # minus 2 because we are not using x,y coord (first 2 channels)
        self.all_feat_c = (deform_in_c - 2) + self.gfe_out_c + self.lfe_out_c

        self.gfe = GlobalFeatExtractor(in_c=gfe_in_c, out_c=self.gfe_out_c)
        self.lfe = LocalFeatExtractor(num_feat=lfe_in_c, out=self.lfe_out_c)

        # ----- self-attention (transformer encoder) block -----
        # The block is applied to the output of `lin`, so `embed_dim` has to
        # equal `hidden_size`.
        self.embed_dim = 512
        self.num_heads = 1
        self.dense_dim = 512
        assert self.embed_dim % self.num_heads == 0
        self.atten = nn.MultiheadAttention(
            embed_dim=self.embed_dim,
            dropout=0.1,
            num_heads=self.num_heads,
            batch_first=True,
        )
        self.pre_attn_norm = nn.LayerNorm(self.embed_dim)
        self.post_attn_norm = nn.LayerNorm(self.embed_dim)
        self.post_attn_dropout = nn.Dropout(0.1)
        self.act_dropout = nn.Dropout(0.1)
        self.dense_1 = nn.Linear(self.embed_dim, self.dense_dim)
        self.dense_2 = nn.Linear(self.dense_dim, self.embed_dim)
        self.pre_dense_norm = nn.LayerNorm(self.embed_dim)
        self.post_dense_norm = nn.LayerNorm(self.dense_dim)
        self.activation = nn.GELU()

        # Linear layer lifting the concatenated input features to the hidden
        # state size.
        self.lin = nn.Linear(self.all_feat_c, self.hidden_size)
        self.deformer = RecurrentGATConv(
            coord_size=2, hidden_size=self.hidden_size, heads=6, concat=False
        )

    def _transformer_block(self, hidden):
        """
        Apply one transformer encoder block (attention + feed-forward).

        Args:
            hidden (Tensor): Batched features, batch dimension first.

        Returns:
            Tensor: Features of the same shape as the input.
        """
        # Self-attention sub-layer with residual connection.
        residual = hidden
        hidden = self.pre_attn_norm(hidden)
        hidden, _ = self.atten(hidden, hidden, hidden)
        hidden = self.post_attn_norm(hidden)  # TODO: This seems to be optional
        hidden = self.post_attn_dropout(hidden)
        hidden = hidden + residual

        # Feed-forward sub-layer with residual connection.
        residual = hidden
        hidden = self.pre_dense_norm(hidden)
        hidden = self.activation(self.dense_1(hidden))
        hidden = self.act_dropout(hidden)
        hidden = self.post_dense_norm(hidden)  # TODO: This seems to be optional
        hidden = self.dense_2(hidden)
        # The same dropout module as the attention sub-layer is reused here.
        hidden = self.post_attn_dropout(hidden)
        return hidden + residual

    def _encode(self, data):
        """
        Build the initial coordinates and hidden state for the deformer.

        Args:
            data (Data): Input data object; reads `x`, `conv_feat`,
                `mesh_feat`, `edge_index` and `node_num`.

        Returns:
            tuple: `(coord, hidden, edge_idx)` where `coord` is the first two
            columns of `data.x`, `hidden` is the flattened per-node hidden
            state and `edge_idx` is `data.edge_index`.
        """
        coord = data.x[:, :2]
        edge_idx = data.edge_index
        batch_size = data.conv_feat.shape[0]

        # One global feature vector per sample, repeated once per node.
        conv_feat = self.gfe(data.conv_feat)
        conv_feat = conv_feat.repeat_interleave(
            data.node_num.reshape(-1), dim=0
        )
        local_feat = self.lfe(data.mesh_feat, edge_idx)

        hidden_in = torch.cat([data.x[:, 2:], local_feat, conv_feat], dim=1)
        hidden = F.selu(self.lin(hidden_in))

        # Reshape to [batch size, node num, feature dim] for the transformer.
        # NOTE(review): this reshape assumes every sample in the batch has
        # the same number of nodes -- confirm against the data loader.
        hidden = hidden.reshape(batch_size, -1, hidden.shape[-1])
        hidden = self._transformer_block(hidden)

        # Flatten back to [batch size * node num, feature dim] for pyG.
        hidden = hidden.reshape(-1, hidden.shape[-1])
        return coord, hidden, edge_idx

    def _deform(self, coord, hidden, edge_idx, num_step):
        """Apply the recurrent GAT deformer `num_step` times."""
        for _ in range(num_step):
            coord, hidden = self.deformer(coord, hidden, edge_idx)
        return coord

    def move(self, data, num_step=1):
        """
        Move the mesh according to the deformation learned, with given number
        steps.

        Args:
            data (Data): Input data object containing mesh and feature info.
            num_step (int): Number of deformation steps.

        Returns:
            coord (Tensor): Deformed coordinates.
        """
        coord, hidden, edge_idx = self._encode(data)
        return self._deform(coord, hidden, edge_idx, num_step)

    def forward(self, data):
        """
        Forward pass for MRN.

        Identical to `move` but always runs `self.num_loop` deformation steps.

        Args:
            data (Data): Input data object containing mesh and feature info.

        Returns:
            coord (Tensor): Deformed coordinates.
        """
        coord, hidden, edge_idx = self._encode(data)
        return self._deform(coord, hidden, edge_idx, self.num_loop)