Spaces:

owaiskha9654
/

Multi-Label-Classification-of-Pubmed-Articles

Runtime error

App Files Files Community

owaiskha9654 committed on Aug 1, 2022

Commit

415ed22

•

1 Parent(s): cd334dd

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -4

app.py CHANGED Viewed

@@ -15,8 +15,17 @@ tokenizer = BertTokenizer.from_pretrained('owaiskha9654/Multi-Label-Classificati
 def Multi_Label_Classification_of_Pubmed_Articles(model_input: str) -> Dict[str, float]:
     # Encoding input data
-    encodings = tokenizer.batch_encode_plus(model_input,max_length=1024,padding=True,truncation=True) # tokenizer's encoding method
-    outs = model(torch.tensor(encodings['input_ids']), token_type_ids=None, attention_mask=torch.tensor(encodings['attention_mask']))
     b_logit_pred = outs[0]
     pred_label = torch.sigmoid(b_logit_pred)
@@ -68,9 +77,9 @@ examples = [
 title = "Multi Label Classification of Pubmed Articles (Paper Night July Edition at Thoucentric)"
 description = "The traditional machine learning models give a lot of pain when we do not have sufficient labeled data for the specific task or domain we care about to train a reliable model. Transfer learning allows us to deal with these scenarios by leveraging the already existing labeled data of some related task or domain. We try to store this knowledge gained in solving the source task in the source domain and apply it to our problem of interest. In this work, I have utilized Transfer Learning utilizing BertForSequenceClassification model to fine tune on Pubmed MultiLabel classification Dataset."
 article = (
-    "Author: Owais Ahmad Data Scientist at Thoucentric <a href=\"https://www.linkedin.com/in/owaiskhan9654/\">Link</a> \n"
     "Model Trained Kaggle on <a href=\"https://www.kaggle.com/code/owaiskhan9654/multi-label-classification-of-pubmed-articles\">Link</a> \n "
-    "My Kaggle Profile <a href=\"https://www.kaggle.com/owaiskhan9654\">Link</a>"
     "HuggingFace Model Deployed Repository <a href=\"https://huggingface.co/owaiskha9654/Multi-Label-Classification-of-PubMed-Articles\">Link</a> \n"
 )

 def Multi_Label_Classification_of_Pubmed_Articles(model_input: str) -> Dict[str, float]:
     # Encoding input data
+    dict_custom={}
+    Preprocess_part1=model_input[:len(model_input)]
+    Preprocess_part2=model_input[len(model_input):]
+    dict1=tokenizer.encode_plus(Preprocess_part1,max_length=1024,padding=True,truncation=True)
+    dict2=tokenizer.encode_plus(Preprocess_part2,max_length=1024,padding=True,truncation=True)
+    dict_custom['input_ids']=[dict1['input_ids'],dict1['input_ids']]
+    dict_custom['token_type_ids']=[dict1['token_type_ids'],dict1['token_type_ids']]
+    dict_custom['attention_mask']=[dict1['attention_mask'],dict1['attention_mask']]
+    outs = model(torch.tensor(dict_custom['input_ids']), token_type_ids=None, attention_mask=torch.tensor(dict_custom['attention_mask']))
     b_logit_pred = outs[0]
     pred_label = torch.sigmoid(b_logit_pred)
 title = "Multi Label Classification of Pubmed Articles (Paper Night July Edition at Thoucentric)"
 description = "The traditional machine learning models give a lot of pain when we do not have sufficient labeled data for the specific task or domain we care about to train a reliable model. Transfer learning allows us to deal with these scenarios by leveraging the already existing labeled data of some related task or domain. We try to store this knowledge gained in solving the source task in the source domain and apply it to our problem of interest. In this work, I have utilized Transfer Learning utilizing BertForSequenceClassification model to fine tune on Pubmed MultiLabel classification Dataset."
 article = (
+    "Author: Owais Ahmad Data Scientist at <b> Thoucentric <b> <a href=\"https://www.linkedin.com/in/owaiskhan9654/\">Link</a>  "
     "Model Trained Kaggle on <a href=\"https://www.kaggle.com/code/owaiskhan9654/multi-label-classification-of-pubmed-articles\">Link</a> \n "
+    "My Kaggle Profile <a href=\"https://www.kaggle.com/owaiskhan9654\">Link</a>  "
     "HuggingFace Model Deployed Repository <a href=\"https://huggingface.co/owaiskha9654/Multi-Label-Classification-of-PubMed-Articles\">Link</a> \n"
 )