
Commit 549e7fc

[#41] add draft asgcn model

raymondng76 committed Dec 13, 2021 (parent 436240e)
Showing 1 changed file with 64 additions and 1 deletion.
sgnlp/models/sentic_asgcn/modeling.py (64 additions, 1 deletion)
@@ -2,6 +2,7 @@

 import torch
 import torch.nn as nn
+import torch.nn.functional as F
 from transformers import PreTrainedModel
 from transformers.file_utils import ModelOutput

@@ -28,7 +29,7 @@ def _init_weights(self, module):


 class SenticASGCNModel(SenticASGCNPreTrainedModel):
-    def __init__(self, config: SenticASGCNConfig):
+    def __init__(self, config: SenticASGCNConfig) -> None:
         super().__init__(config)
         self.text_lstm = DynamicLSTM(
             config.embed_dim,
@@ -41,3 +42,65 @@ def __init__(self, config: SenticASGCNConfig):
         self.gc2 = GraphConvolution(2 * config.hidden_dim, 2 * config.hidden_dim)
         self.fc = nn.Linear(2 * config.hidden_dim, config.polarities_dim)
         self.text_embed_dropout = nn.Dropout(config.dropout)
+        self.device = config.device

+    def position_weight(self, x, aspect_double_idx, text_len, aspect_len):
+        # Scale each token's hidden state by its proximity to the aspect span:
+        # context words closer to the aspect get larger weights, while the
+        # aspect tokens themselves and padding positions are zeroed out.
+        batch_size = x.shape[0]
+        seq_len = x.shape[1]
+        aspect_double_idx = aspect_double_idx.cpu().numpy()
+        text_len = text_len.cpu().numpy()
+        aspect_len = aspect_len.cpu().numpy()
+        weight = [[] for i in range(batch_size)]
+        for i in range(batch_size):
+            context_len = text_len[i] - aspect_len[i]
+            for j in range(aspect_double_idx[i, 0]):
+                weight[i].append(1 - (aspect_double_idx[i, 0] - j) / context_len)
+            for j in range(aspect_double_idx[i, 0], aspect_double_idx[i, 1] + 1):
+                weight[i].append(0)
+            for j in range(aspect_double_idx[i, 1] + 1, text_len[i]):
+                weight[i].append(1 - (j - aspect_double_idx[i, 1]) / context_len)
+            for j in range(text_len[i], seq_len):
+                weight[i].append(0)
+        weight = torch.tensor(weight, dtype=torch.float).unsqueeze(2).to(self.device)
+        return weight * x

+    def mask(self, x, aspect_double_idx):
+        # Zero out every hidden state outside the aspect span, keeping only
+        # the aspect tokens' representations.
+        batch_size, seq_len = x.shape[0], x.shape[1]
+        aspect_double_idx = aspect_double_idx.cpu().numpy()
+        mask = [[] for i in range(batch_size)]
+        for i in range(batch_size):
+            for j in range(aspect_double_idx[i, 0]):
+                mask[i].append(0)
+            for j in range(aspect_double_idx[i, 0], aspect_double_idx[i, 1] + 1):
+                mask[i].append(1)
+            for j in range(aspect_double_idx[i, 1] + 1, seq_len):
+                mask[i].append(0)
+        mask = torch.tensor(mask, dtype=torch.float).unsqueeze(2).to(self.device)
+        return mask * x

+    def forward(self, inputs):
+        text_indices, aspect_indices, left_indices, adj = inputs
+        # Sequence lengths are recovered from the non-padding (non-zero) token ids.
+        text_len = torch.sum(text_indices != 0, dim=-1)
+        aspect_len = torch.sum(aspect_indices != 0, dim=-1)
+        left_len = torch.sum(left_indices != 0, dim=-1)
+        # Start and end positions of the aspect span within each sentence.
+        aspect_double_idx = torch.cat(
+            [left_len.unsqueeze(1), (left_len + aspect_len - 1).unsqueeze(1)], dim=1
+        )
+        text = self.text_embed_dropout(self.embed(text_indices))
+        text_out, (_, _) = self.text_lstm(text, text_len)
+        # Two graph convolution layers over position-weighted LSTM states.
+        x = F.relu(
+            self.gc1(
+                self.position_weight(text_out, aspect_double_idx, text_len, aspect_len),
+                adj,
+            )
+        )
+        x = F.relu(
+            self.gc2(
+                self.position_weight(x, aspect_double_idx, text_len, aspect_len), adj
+            )
+        )
+        # Attention of the GCN features over the LSTM outputs yields the
+        # final sentence representation fed to the classifier.
+        alpha_mat = torch.matmul(x, text_out.transpose(1, 2))
+        alpha = F.softmax(alpha_mat.sum(1, keepdim=True), dim=2)
+        x = torch.matmul(alpha, text_out).squeeze(1)  # batch_size x 2 * hidden_dim
+        output = self.fc(x)
+        return output
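
For context, the snippet below is a standalone sketch (not part of the commit) showing how the inputs expected by forward() relate to the position-weighting scheme above. The token ids, sentence length, and variable names are made up for illustration only.

import torch

# Illustrative only: one sentence padded to length 10, with 7 real tokens and a
# 2-token aspect term starting after 3 left-context tokens. Token ids are made up.
text_indices   = torch.tensor([[5, 9, 2, 7, 8, 4, 6, 0, 0, 0]])  # 0 = padding id
aspect_indices = torch.tensor([[7, 8, 0, 0, 0]])
left_indices   = torch.tensor([[5, 9, 2, 0, 0]])

text_len   = torch.sum(text_indices != 0, dim=-1)    # tensor([7])
aspect_len = torch.sum(aspect_indices != 0, dim=-1)  # tensor([2])
left_len   = torch.sum(left_indices != 0, dim=-1)    # tensor([3])

# Aspect span boundaries, computed exactly as in forward(): start = number of
# left-context tokens, end = start + aspect length - 1.
aspect_double_idx = torch.cat(
    [left_len.unsqueeze(1), (left_len + aspect_len - 1).unsqueeze(1)], dim=1
)
print(aspect_double_idx)  # tensor([[3, 4]])

# Weights that position_weight() would assign to this sentence: left and right
# context scaled by distance to the aspect, aspect and padding positions zeroed.
start, end = aspect_double_idx[0].tolist()
seq_len = text_indices.shape[1]
n_text, n_aspect = text_len[0].item(), aspect_len[0].item()
context_len = n_text - n_aspect  # 5
weights = []
for j in range(seq_len):
    if j < start:
        weights.append(1 - (start - j) / context_len)
    elif j <= end:
        weights.append(0.0)
    elif j < n_text:
        weights.append(1 - (j - end) / context_len)
    else:
        weights.append(0.0)
print(weights)  # approximately [0.4, 0.6, 0.8, 0.0, 0.0, 0.8, 0.6, 0.0, 0.0, 0.0]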
