DAMO-NLP-SG
/

zero-shot-classify-SSTuning-ALBERT

@@ -31,8 +31,7 @@ There are three versions of models released. The details are:
 |------------|-----------|----------|-------|-------|----|
 |   [zero-shot-classify-SSTuning-base](https://huggingface.co/DAMO-NLP-SG/zero-shot-classify-SSTuning-base)    |  [roberta-base](https://huggingface.co/roberta-base)      |  125M    |  Low    |  High    | 20.48M |
 |   [zero-shot-classify-SSTuning-large](https://huggingface.co/DAMO-NLP-SG/zero-shot-classify-SSTuning-large)    |    [roberta-large](https://huggingface.co/roberta-large)      | 355M     |   Medium   | Medium | 5.12M |
-|   [zero-shot-classify-SSTuning-ALBERT](https://huggingface.co/DAMO-NLP-SG/zero-shot-classify-SSTuning-ALBERT)
-   |  [albert-xxlarge-v2](https://huggingface.co/albert-xxlarge-v2)      |  235M   |    High  | Low| 5.12M |
 Please note that zero-shot-classify-SSTuning-base is trained with more data (20.48M) than the paper, as this will increase the accuracy.
@@ -49,31 +48,39 @@ You can try the model with the Colab [Notebook](https://colab.research.google.co
 from transformers import AutoTokenizer, AutoModelForSequenceClassification
 import torch, string, random
-tokenizer = AutoTokenizer.from_pretrained("DAMO-NLP-SG/zero-shot-classify-SSTuning-base")
-model = AutoModelForSequenceClassification.from_pretrained("DAMO-NLP-SG/zero-shot-classify-SSTuning-base")
 text = "I love this place! The food is always so fresh and delicious."
 list_label = ["negative", "positive"]
 list_ABC = [x for x in string.ascii_uppercase]
-def add_prefix(text, list_label, shuffle = False):
     list_label = [x+'.' if x[-1] != '.' else x for x in list_label]
     list_label_new = list_label + [tokenizer.pad_token]* (20 - len(list_label))
     if shuffle:
         random.shuffle(list_label_new)
     s_option = ' '.join(['('+list_ABC[i]+') '+list_label_new[i] for i in range(len(list_label_new))])
-    return f'{s_option} {tokenizer.sep_token} {text}', list_label_new
-text_new, list_label_new = add_prefix(text,list_label,shuffle=False)
-encoding = tokenizer([text_new],truncation=True, padding='max_length',max_length=512, return_tensors='pt')
-with torch.no_grad():
-    logits = model(**encoding).logits
     probs = torch.nn.functional.softmax(logits, dim = -1).tolist()
-    predictions = torch.argmax(logits, dim=-1)
-print(probs)
-print(predictions)
 ```

 |------------|-----------|----------|-------|-------|----|
 |   [zero-shot-classify-SSTuning-base](https://huggingface.co/DAMO-NLP-SG/zero-shot-classify-SSTuning-base)    |  [roberta-base](https://huggingface.co/roberta-base)      |  125M    |  Low    |  High    | 20.48M |
 |   [zero-shot-classify-SSTuning-large](https://huggingface.co/DAMO-NLP-SG/zero-shot-classify-SSTuning-large)    |    [roberta-large](https://huggingface.co/roberta-large)      | 355M     |   Medium   | Medium | 5.12M |
+|   [zero-shot-classify-SSTuning-ALBERT](https://huggingface.co/DAMO-NLP-SG/zero-shot-classify-SSTuning-ALBERT) |  [albert-xxlarge-v2](https://huggingface.co/albert-xxlarge-v2)      |  235M   |    High  | Low| 5.12M |
 Please note that zero-shot-classify-SSTuning-base is trained with more data (20.48M) than the paper, as this will increase the accuracy.
 from transformers import AutoTokenizer, AutoModelForSequenceClassification
 import torch, string, random
+tokenizer = AutoTokenizer.from_pretrained("albert-xxlarge-v2")
+model = AutoModelForSequenceClassification.from_pretrained("DAMO-NLP-SG/zero-shot-classify-SSTuning-ALBERT")
 text = "I love this place! The food is always so fresh and delicious."
 list_label = ["negative", "positive"]
+device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')
 list_ABC = [x for x in string.ascii_uppercase]
+def check_text(model, text, list_label, shuffle=False):
     list_label = [x+'.' if x[-1] != '.' else x for x in list_label]
     list_label_new = list_label + [tokenizer.pad_token]* (20 - len(list_label))
     if shuffle:
         random.shuffle(list_label_new)
     s_option = ' '.join(['('+list_ABC[i]+') '+list_label_new[i] for i in range(len(list_label_new))])
+    text = f'{s_option} {tokenizer.sep_token} {text}'
+    model.to(device).eval()
+    encoding = tokenizer([text],truncation=True, max_length=512,return_tensors='pt')
+    item = {key: val.to(device) for key, val in encoding.items()}
+    logits = model(**item).logits
+    logits = logits if shuffle else logits[:,0:len(list_label)]
     probs = torch.nn.functional.softmax(logits, dim = -1).tolist()
+    predictions = torch.argmax(logits, dim=-1).item()
+    probabilities = [round(x,5) for x in probs[0]]
+    print(f'prediction:    {predictions} => ({list_ABC[predictions]}) {list_label_new[predictions]}')
+    print(f'probability:   {round(probabilities[predictions]*100,2)}%')
+check_text(model, text, list_label)
+# prediction:    1 => (B) positive.
+# probability:   98.64%
 ```