cshin23
/

multidim-rm_reg_gating_prototype

Text Classification

pytorch_model_hub_mixin

model_hub_mixin

Model card Files Files and versions

cshin23 committed on Jul 26, 2024

Commit

37f71e0

·

verified ·

1 Parent(s): 24aceef

Create modeling_custom.py

Files changed (1) hide show

modeling_custom.py +29 -0

modeling_custom.py ADDED Viewed

	@@ -0,0 +1,29 @@

+from torch import nn
+from huggingface_hub import PyTorchModelHubMixin
+class GatedRegressionModel(nn.Module, PyTorchModelHubMixin):  # base classifier whose scores are scaled by a learned gate and summed to one value per input row
+    def __init__(self, base_model):  # base_model must expose .distilbert, .pre_classifier and .classifier (all three are used below)
+        super().__init__()
+        self.base_model = base_model
+        self.hidden_dim = 1024  # width of the two hidden layers of the gate MLP
+        self.gate_model = nn.ModuleList([  # a ModuleList is not callable as a network; forward() applies these layers in order
+            nn.Linear(self.base_model.pre_classifier.out_features, self.hidden_dim, bias=True),  # gate input is the pre_classifier output
+            nn.GELU(),
+            nn.Dropout(p=0.2),
+            nn.Linear(self.hidden_dim, self.hidden_dim, bias=True),
+            nn.GELU(),
+            nn.Dropout(p=0.2),
+            nn.Linear(self.hidden_dim, 1, bias=True),  # single output unit: one gate value per input row
+            nn.GELU(),  # the 1-unit gate output is passed through GELU as well ...
+            nn.Dropout(p=0.2),  # ... and through Dropout; NOTE(review): in train mode a dropped gate zeroes that row's whole output — confirm intended
+        ])
+    def forward(self, input_ids, attention_mask):  # returns (gate * scores) summed over axis 1
+        o = self.base_model.distilbert(input_ids=input_ids, attention_mask=attention_mask)[0][:, 0]  # first output, index 0 along axis 1 — presumably the first-token ([CLS]) hidden state; DistilBERT is encoder-only, not encoder-decoder
+        o = self.base_model.pre_classifier(o)
+        scores = self.base_model.classifier(o)  # NOTE(review): no activation between pre_classifier and classifier here — confirm intended
+        gate = o  # the gate branch starts from the same pre_classifier features that produced the scores
+        for layer in self.gate_model:
+            gate = layer(gate)
+        return (gate * scores).sum(axis=1)  # gate's last dimension is 1, so it broadcasts across the scores before the sum