embeding_api

Paused

Arafath10 committed on Jul 31, 2024

Commit

07fb065

verified ·

1 Parent(s): e59b55b

Update main.py

Files changed (1) hide show

main.py CHANGED Viewed

@@ -2,6 +2,19 @@ from fastapi import FastAPI, HTTPException
 from fastapi.responses import JSONResponse
 from fastapi.middleware.cors import CORSMiddleware
 app = FastAPI()
 app.add_middleware(
@@ -12,11 +25,30 @@ app.add_middleware(
     allow_headers=["*"],
 )
-@app.post("/get_n_depth_results")
-async def get_n_depth_results(url,input_query):
-          return "done"

 from fastapi.responses import JSONResponse
 from fastapi.middleware.cors import CORSMiddleware
+from transformers import AutoModel, AutoTokenizer
+import torch
+# CPU device handle.
+# NOTE(review): `device` is not referenced by any of the code visible here — confirm it is still needed.
+device = torch.device("cpu")
+# Load the model and tokenizer once, at import time, so request handlers can reuse them.
+# trust_remote_code=True lets transformers run the custom code shipped in the
+# "nomic-ai/nomic-embed-text-v1.5" repository.
+model = AutoModel.from_pretrained(
+    "nomic-ai/nomic-embed-text-v1.5", trust_remote_code=True
+)
+tokenizer = AutoTokenizer.from_pretrained(
+    "nomic-ai/nomic-embed-text-v1.5", trust_remote_code=True
+)
 app = FastAPI()
 app.add_middleware(
     allow_headers=["*"],
 )
+def chunk_text(text, chunk_size=512):
+    """Split ``text`` into consecutive pieces of at most ``chunk_size`` characters.
+
+    Args:
+        text: The string to split.
+        chunk_size: Maximum number of characters per piece; must be positive.
+
+    Returns:
+        A list of substrings in their original order. The last piece may be
+        shorter than ``chunk_size``; an empty ``text`` yields an empty list.
+
+    Raises:
+        ValueError: If ``chunk_size`` is zero or negative.
+    """
+    # A negative step would make range() empty and silently drop the whole
+    # text, and a zero step fails with an unrelated-looking range() error.
+    if chunk_size <= 0:
+        raise ValueError("chunk_size must be a positive integer")
+    return [text[i:i + chunk_size] for i in range(0, len(text), chunk_size)]
+@app.post("/get_embeding")
+async def get_embeding(text):
+    """Embed ``text`` chunk by chunk and return one mean-pooled vector per chunk.
+
+    The text is split with ``chunk_text``; each chunk is tokenized, run through
+    the model without gradient tracking, and its token embeddings are averaged
+    into a single vector.
+
+    Args:
+        text: The input string to embed.
+
+    Returns:
+        A list with one entry per chunk, each entry a list of floats. An empty
+        ``text`` produces an empty list.
+    """
+    # NOTE(review): the model call below is synchronous, so this coroutine
+    # blocks the event loop while it runs.
+    chunk_vectors = []
+    for chunk in chunk_text(text):
+        # Tokenize the chunk into PyTorch tensors.
+        inputs = tokenizer(chunk, return_tensors="pt")
+        # Inference only: no gradients are needed.
+        with torch.no_grad():
+            outputs = model(**inputs)
+        # Average the token embeddings over dim 1 to get a single vector for
+        # the chunk (assumes last_hidden_state is (1, tokens, hidden) — TODO confirm).
+        chunk_vectors.append(torch.mean(outputs.last_hidden_state, dim=1))
+    if not chunk_vectors:
+        return []
+    # Stack the per-chunk rows and convert to plain nested lists so the
+    # response can be serialized as JSON.
+    return torch.cat(chunk_vectors, dim=0).tolist()