DAMO-NLP-SG
/

zero-shot-classify-SSTuning-large

Zero-Shot Classification

text-classification

Zero-Shot Classification

Model card Files Files and versions Community

lukecq commited on May 28, 2023

Commit

459852d

·

1 Parent(s): d334121

Update README.md

Files changed (1) hide show

README.md +21 -13

README.md CHANGED Viewed

@@ -49,31 +49,39 @@ You can try the model with the Colab [Notebook](https://colab.research.google.co
 from transformers import AutoTokenizer, AutoModelForSequenceClassification
 import torch, string, random
-tokenizer = AutoTokenizer.from_pretrained("DAMO-NLP-SG/zero-shot-classify-SSTuning-base")
-model = AutoModelForSequenceClassification.from_pretrained("DAMO-NLP-SG/zero-shot-classify-SSTuning-base")
 text = "I love this place! The food is always so fresh and delicious."
 list_label = ["negative", "positive"]
 list_ABC = [x for x in string.ascii_uppercase]
-def add_prefix(text, list_label, shuffle = False):
     list_label = [x+'.' if x[-1] != '.' else x for x in list_label]
     list_label_new = list_label + [tokenizer.pad_token]* (20 - len(list_label))
     if shuffle:
         random.shuffle(list_label_new)
     s_option = ' '.join(['('+list_ABC[i]+') '+list_label_new[i] for i in range(len(list_label_new))])
-    return f'{s_option} {tokenizer.sep_token} {text}', list_label_new
-text_new, list_label_new = add_prefix(text,list_label,shuffle=False)
-encoding = tokenizer([text_new],truncation=True, padding='max_length',max_length=512, return_tensors='pt')
-with torch.no_grad():
-    logits = model(**encoding).logits
     probs = torch.nn.functional.softmax(logits, dim = -1).tolist()
-    predictions = torch.argmax(logits, dim=-1)
-print(probs)
-print(predictions)
 ```

 from transformers import AutoTokenizer, AutoModelForSequenceClassification
 import torch, string, random
+tokenizer = AutoTokenizer.from_pretrained("DAMO-NLP-SG/zero-shot-classify-SSTuning-large")
+model = AutoModelForSequenceClassification.from_pretrained("DAMO-NLP-SG/zero-shot-classify-SSTuning-large")
 text = "I love this place! The food is always so fresh and delicious."
 list_label = ["negative", "positive"]
+device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')
 list_ABC = [x for x in string.ascii_uppercase]
+def check_text(model, text, list_label, shuffle=False):
     list_label = [x+'.' if x[-1] != '.' else x for x in list_label]
     list_label_new = list_label + [tokenizer.pad_token]* (20 - len(list_label))
     if shuffle:
         random.shuffle(list_label_new)
     s_option = ' '.join(['('+list_ABC[i]+') '+list_label_new[i] for i in range(len(list_label_new))])
+    text = f'{s_option} {tokenizer.sep_token} {text}'
+    model.to(device).eval()
+    encoding = tokenizer([text],truncation=True, max_length=512,return_tensors='pt')
+    item = {key: val.to(device) for key, val in encoding.items()}
+    logits = model(**item).logits
+    logits = logits if shuffle else logits[:,0:len(list_label)]
     probs = torch.nn.functional.softmax(logits, dim = -1).tolist()
+    predictions = torch.argmax(logits, dim=-1).item()
+    probabilities = [round(x,5) for x in probs[0]]
+    print(f'prediction:    {predictions} => ({list_ABC[predictions]}) {list_label_new[predictions]}')
+    print(f'probability:   {round(probabilities[predictions]*100,2)}%')
+check_text(model, text, list_label)
+# prediction:    1 => (B) positive.
+# probability:   99.84%
 ```