Mortie1
/

new-nlp-hw3-llama3

Text Generation

Model card Files Files and versions

Mortie1 committed on Nov 12, 2024

Commit

eb80782

·

verified ·

1 Parent(s): 6602da5

Upload MyLLaMa

Files changed (1) hide show

configure_for_hf.py +5 -6

configure_for_hf.py CHANGED Viewed

@@ -64,13 +64,12 @@ class MyLLaMa(PreTrainedModel):
                 -torch.inf,
             )
             .transpose(0, 1)
-            .cuda(),
-        )
-        pad_mask = (
-            torch.where(
-                tensor == self.model.tokenizer.pad_token_id, False, True
-            ).cuda(),
         )
         logits = self.model(tensor, att_mask, pad_mask)["logits"]
         if labels is not None:
             loss = nn.functional.cross_entropy(logits, labels)

                 -torch.inf,
             )
             .transpose(0, 1)
+            .cuda()
         )
+        pad_mask = torch.where(
+            tensor == self.model.tokenizer.pad_token_id, False, True
+        ).cuda()
         logits = self.model(tensor, att_mask, pad_mask)["logits"]
         if labels is not None:
             loss = nn.functional.cross_entropy(logits, labels)