Spaces:
Build error
Build error
File size: 682 Bytes
25fc3a2 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 |
from transformers import AutoTokenizer, AutoModel
import torch
class EmbeddingGenerator:
def __init__(self):
self.model_name = "deepset/all-mpnet-base-v2-table"
self.tokenizer = AutoTokenizer.from_pretrained(self.model_name)
self.model = AutoModel.from_pretrained(self.model_name)
def generate_embeddings(self, dataframes):
embeddings = []
for df in dataframes:
inputs = self.tokenizer(df.to_string(index=False), return_tensors='pt', truncation=True, padding=True)
outputs = self.model(**inputs)
embeddings.append(outputs.last_hidden_state.mean(dim=1).detach().numpy())
return embeddings
|