sxtforreal
/

CHOPT

Feature Extraction

English

NLP

Model card Files Files and versions Community

sxtforreal committed on Mar 6, 2024

Commit

7f4f2d3

verified ·

1 Parent(s): 504db9e

Create loss.py

Browse files

This file holds four loss functions, one for each of the four models.

Files changed (1) hide show

loss.py +228 -0

loss.py ADDED Viewed

	@@ -0,0 +1,228 @@

+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+import config
class ContrastiveLoss_simcse(nn.Module):
    """SimCSE-style contrastive loss for one labelled group of embeddings.

    Rows of the input are picked out by label: 0 marks the anchor, 1 the
    positive(s) and 2 the negatives.  For an anchor ``a`` and positive ``p``
    the loss is::

        -log( exp(sim(a, p) / t) / sum_c exp(sim(a, c) / t) )

    where ``c`` ranges over positives and negatives, ``t`` is the temperature
    and ``sim`` is the dot product of L2-normalised embeddings.

    Args:
        temperature: Softmax temperature.  When omitted, ``config.temperature``
            is used.
    """

    def __init__(self, temperature=None):
        super().__init__()
        self.temperature = (
            config.temperature if temperature is None else temperature
        )

    def forward(self, feature_vectors, labels):
        """Compute the loss.

        Args:
            feature_vectors: 2-D tensor with one embedding per row.
            labels: 1-D tensor aligned with the rows (0 anchor, 1 positive,
                2 negative).

        Returns:
            Tensor of shape ``(num_anchors, num_positives)``; a single element
            in the usual one-anchor / one-positive setting.  The denominator
            is summed over every anchor/candidate pair, so the formula above
            holds per anchor only when exactly one row is labelled 0.
        """
        # Normalise each embedding (row) to unit length so that dot products
        # are cosine similarities, independent of the other rows in the batch.
        normalized_features = F.normalize(feature_vectors, p=2, dim=1)

        anchor = normalized_features[labels == 0]
        positives = normalized_features[labels == 1]
        negatives = normalized_features[labels == 2]
        candidates = torch.cat([positives, negatives])

        pos_logits = torch.matmul(anchor, positives.t()) / self.temperature
        all_logits = torch.matmul(anchor, candidates.t()) / self.temperature

        # -log(exp(pos) / sum(exp(all))) == logsumexp(all) - pos.  Working in
        # log space avoids overflow of exp() at small temperatures.
        log_denominator = torch.logsumexp(all_logits.reshape(-1), dim=0)
        return log_denominator - pos_logits
class ContrastiveLoss_simcse_w(nn.Module):
    """SimCSE-style contrastive loss with per-candidate weighting.

    Rows of the input are picked out by label: 0 marks the anchor, 1 the
    positive(s) and 2 the negatives.  Each candidate's logit in the
    denominator is multiplied by a weight: positives use their raw score,
    negatives use ``1 + s / ||s||_2`` where ``s`` is the vector of negative
    scores.  The numerator is left unweighted.

    Args:
        temperature: Softmax temperature.  When omitted, ``config.temperature``
            is used.
    """

    def __init__(self, temperature=None):
        super().__init__()
        self.temperature = (
            config.temperature if temperature is None else temperature
        )

    def forward(self, feature_vectors, labels, scores):
        """Compute the weighted loss.

        Args:
            feature_vectors: 2-D tensor with one embedding per row.
            labels: 1-D tensor aligned with the rows (0 anchor, 1 positive,
                2 negative).
            scores: 1-D tensor aligned with ``labels``; the anchor's entry is
                ignored.

        Returns:
            Tensor of shape ``(num_anchors, num_positives)``.  The denominator
            is summed over every anchor/candidate pair.
        """
        # Normalise each embedding (row) to unit length so that dot products
        # are cosine similarities, independent of the other rows in the batch.
        normalized_features = F.normalize(feature_vectors, p=2, dim=1)

        is_positive = labels == 1
        is_negative = labels == 2

        # Candidate weights, in the same order as the candidate rows below.
        pos_weights = scores[is_positive].float()
        neg_weights = F.normalize(scores[is_negative].float(), p=2, dim=0) + 1
        weights = torch.cat([pos_weights, neg_weights])

        anchor = normalized_features[labels == 0]
        positives = normalized_features[is_positive]
        negatives = normalized_features[is_negative]
        candidates = torch.cat([positives, negatives])

        pos_logits = torch.matmul(anchor, positives.t()) / self.temperature
        weighted_logits = weights * (
            torch.matmul(anchor, candidates.t()) / self.temperature
        )

        # -log(exp(pos) / sum(exp(w * all))) == logsumexp(w * all) - pos.
        # Working in log space avoids overflow of exp().
        log_denominator = torch.logsumexp(weighted_logits.reshape(-1), dim=0)
        return log_denominator - pos_logits
class ContrastiveLoss_samp(nn.Module):
    """Supervised contrastive loss without weighting.

    Rows of the input are picked out by label: 0 marks the anchor, 1 the
    positives and 2 the negatives.  The loss averages, over the positives,
    the negative log-probability of each positive under a softmax over all
    positives and negatives::

        -(1 / |P|) * sum_p log( exp(sim(a, p) / t) / sum_c exp(sim(a, c) / t) )

    where ``sim`` is the dot product of L2-normalised embeddings.

    Args:
        temperature: Softmax temperature.  When omitted, ``config.temperature``
            is used.
    """

    def __init__(self, temperature=None):
        super().__init__()
        self.temperature = (
            config.temperature if temperature is None else temperature
        )

    def forward(self, feature_vectors, labels):
        """Compute the loss.

        Args:
            feature_vectors: 2-D tensor with one embedding per row.
            labels: 1-D tensor aligned with the rows (0 anchor, 1 positive,
                2 negative).

        Returns:
            Scalar tensor.  The denominator is summed over every
            anchor/candidate pair, so the formula above holds per anchor only
            when exactly one row is labelled 0.

        Raises:
            ZeroDivisionError: If no row is labelled as a positive.
        """
        # Normalise each embedding (row) to unit length so that dot products
        # are cosine similarities, independent of the other rows in the batch.
        normalized_features = F.normalize(feature_vectors, p=2, dim=1)

        anchor = normalized_features[labels == 0]
        positives = normalized_features[labels == 1]
        negatives = normalized_features[labels == 2]
        candidates = torch.cat([positives, negatives])
        pos_cardinal = positives.shape[0]

        pos_logits = torch.matmul(anchor, positives.t()) / self.temperature
        all_logits = torch.matmul(anchor, candidates.t()) / self.temperature

        # log(exp(pos) / sum(exp(all))) == pos - logsumexp(all).  Working in
        # log space avoids overflow of exp() at small temperatures.
        log_denominator = torch.logsumexp(all_logits.reshape(-1), dim=0)
        sum_log_ent = torch.sum(pos_logits - log_denominator)

        scale = -1 / pos_cardinal
        return scale * sum_log_ent
class ContrastiveLoss_samp_w(nn.Module):
    """Supervised contrastive loss with per-candidate weighting.

    Rows of the input are picked out by label: 0 marks the anchor, 1 the
    positives and 2 the negatives.  Each candidate's logit in the denominator
    is multiplied by a weight: positives use their raw score, negatives use
    ``1 + s / ||s||_2`` where ``s`` is the vector of negative scores.  The
    numerator is left unweighted, and the summed log-ratio is averaged over
    the number of positives.

    Args:
        temperature: Softmax temperature.  When omitted, ``config.temperature``
            is used.
    """

    def __init__(self, temperature=None):
        super().__init__()
        self.temperature = (
            config.temperature if temperature is None else temperature
        )

    def forward(self, feature_vectors, labels, scores):
        """Compute the weighted loss.

        Args:
            feature_vectors: 2-D tensor with one embedding per row.
            labels: 1-D tensor aligned with the rows (0 anchor, 1 positive,
                2 negative).
            scores: 1-D tensor aligned with ``labels``; the anchor's entry is
                ignored.

        Returns:
            Scalar tensor.  The denominator is summed over every
            anchor/candidate pair.

        Raises:
            ZeroDivisionError: If no row is labelled as a positive.
        """
        # Normalise each embedding (row) to unit length so that dot products
        # are cosine similarities, independent of the other rows in the batch.
        normalized_features = F.normalize(feature_vectors, p=2, dim=1)

        is_positive = labels == 1
        is_negative = labels == 2

        # Pick scores by label rather than by position so each weight stays
        # paired with its own embedding whatever the row order of the batch.
        pos_weights = scores[is_positive].float()
        neg_weights = F.normalize(scores[is_negative].float(), p=2, dim=0) + 1
        weights = torch.cat([pos_weights, neg_weights])

        anchor = normalized_features[labels == 0]
        positives = normalized_features[is_positive]
        negatives = normalized_features[is_negative]
        candidates = torch.cat([positives, negatives])
        pos_cardinal = positives.shape[0]

        pos_logits = torch.matmul(anchor, positives.t()) / self.temperature
        weighted_logits = weights * (
            torch.matmul(anchor, candidates.t()) / self.temperature
        )

        # log(exp(pos) / sum(exp(w * all))) == pos - logsumexp(w * all).
        # Working in log space avoids overflow of exp().
        log_denominator = torch.logsumexp(weighted_logits.reshape(-1), dim=0)
        sum_log_ent = torch.sum(pos_logits - log_denominator)

        scale = -1 / pos_cardinal
        return scale * sum_log_ent