Spaces:

blazingbunny
/

BERT-Semantic-checker

Runtime error

blazingbunny committed on Mar 28, 2024

Commit

80f8209

verified ·

1 Parent(s): 9d4445b

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,27 +1,19 @@
 import streamlit as st
-import torch
-from transformers import BertModel, BertTokenizer
-# Load pre-trained BERT model and tokenizer
 @st.cache_resource
-def load_bert():
-    tokenizer = BertTokenizer.from_pretrained('bert-base-uncased')
-    model = BertModel.from_pretrained('bert-base-uncased')
-    return tokenizer, model
-tokenizer, model = load_bert()
 def calculate_similarity(word1, word2):
-    # Tokenize and get embeddings
-    input_ids1 = torch.tensor([tokenizer.encode(word1, add_special_tokens=True)])
-    input_ids2 = torch.tensor([tokenizer.encode(word2, add_special_tokens=True)])
-    with torch.no_grad():
-        embeddings1 = model(input_ids1)[0][0, 0, :]
-        embeddings2 = model(input_ids2)[0][0, 0, :]
     cos_sim = torch.nn.functional.cosine_similarity(embeddings1, embeddings2, dim=0)
-    return cos_sim.item()  # Convert tensor to a float
 # Streamlit interface
 st.title("Word Similarity Checker")

 import streamlit as st
+from sentence_transformers import SentenceTransformer
+# Load SBERT model (choose a suitable model from https://www.sbert.net/docs/pretrained_models.html)
 @st.cache_resource
 def load_sbert():
     """Build and return the SentenceTransformer used for embeddings.

     The 'all-MiniLM-L6-v2' checkpoint is an example choice; any other
     SentenceTransformer model name can be substituted here. The function
     is wrapped in ``st.cache_resource``.
     """
     return SentenceTransformer('all-MiniLM-L6-v2')
 model = load_sbert()
 def calculate_similarity(word1, word2):
     """Return the cosine similarity of the embeddings of two texts.

     Args:
         word1: First word or sentence to embed.
         word2: Second word or sentence to embed.

     Returns:
         The cosine similarity of the two embeddings as a Python float.
     """
     # Imported locally because the imports visible at the top of this file
     # do not include torch, yet the cosine computation below needs it.
     import torch
     # Ask encode() for torch tensors: its default output is a NumPy array,
     # which torch.nn.functional.cosine_similarity does not accept.
     embeddings1 = model.encode(word1, convert_to_tensor=True)
     embeddings2 = model.encode(word2, convert_to_tensor=True)
     # A single input string yields a 1-D embedding, so compare along dim 0.
     cos_sim = torch.nn.functional.cosine_similarity(embeddings1, embeddings2, dim=0)
     return cos_sim.item()
 # Streamlit interface
 st.title("Word Similarity Checker")