Spaces:

johann22
/

emb-1

Sleeping

App Files Files Community

johann22 committed on Jul 12

Commit

640f959

verified ·

1 Parent(s): f63f033

Create app.py

Browse files

Files changed (1) hide show

app.py +121 -0

app.py ADDED Viewed

	@@ -0,0 +1,121 @@

+import gradio as gr
+import numpy as np
+import logging
+import threading
+from sentence_transformers import SentenceTransformer
+# --- Setup Logging (root logger at INFO; `log` is this module's logger) ---
+logging.basicConfig(level=logging.INFO)
+log = logging.getLogger(__name__)
+# --- Global SentenceTransformer Model ---
+# Cache slot and its guarding lock for the shared model; _get_embedder() fills the slot lazily on first use.
+_embedder_instance = None
+_embedder_lock = threading.Lock()
+MODEL_NAME = 'all-MiniLM-L6-v2'
+def _get_embedder():
+    """
+    Lazily and thread-safely initializes and returns the SentenceTransformer embedder.
+    """
+    global _embedder_instance
+    # Use a double-checked lock to avoid acquiring the lock for every request
+    if _embedder_instance is None:
+        with _embedder_lock:
+            # Check again inside the lock to ensure it wasn't initialized by another thread
+            # while the current thread was waiting for the lock.
+            if _embedder_instance is None:
+                try:
+                    log.info(f"Loading SentenceTransformer model: {MODEL_NAME} (lazy init)...")
+                    _embedder_instance = SentenceTransformer(MODEL_NAME)
+                    log.info("SentenceTransformer model loaded successfully.")
+                except Exception as e:
+                    log.critical(f"Failed to load SentenceTransformer model: {e}", exc_info=True)
+                    # The instance remains None, so subsequent calls will retry.
+                    _embedder_instance = None
+    return _embedder_instance
+def generate_embeddings(texts: list[str]) -> dict:
+    """
+    Generates embeddings for a list of input texts.
+    Args:
+        texts: A list of strings to be embedded.
+    Returns:
+        A dictionary containing the list of embedding vectors or an error message.
+    """
+    if not isinstance(texts, list) or not all(isinstance(t, str) for t in texts):
+        # Gradio's JSON component will likely parse it correctly, but this is a good safeguard.
+        log.error("Invalid input: 'texts' must be a list of strings.")
+        return {"error": "Invalid input format. Expected a list of strings."}
+    embedder = _get_embedder()
+    if embedder is None:
+        log.error("Embedder not available. Cannot generate embeddings.")
+        # We don't return a 500 error here so the client can see the message.
+        # In a real production system, you might raise an exception to trigger a 500.
+        return {"error": "Embedding model is not available. Please check the server logs."}
+    try:
+        log.info(f"Generating embeddings for {len(texts)} text(s).")
+        # The encode function is thread-safe.
+        embeddings = embedder.encode(texts, convert_to_numpy=True).tolist()
+        log.info("Embeddings generated successfully.")
+        return {"embeddings": embeddings}
+    except Exception as e:
+        log.error(f"An error occurred during embedding generation: {e}", exc_info=True)
+        return {"error": f"An unexpected error occurred: {e}"}
+# --- Create the Gradio Interface ---
+# gr.JSON is used for both input and output for flexibility and API-friendliness. NOTE(review): the endpoint path and response envelope documented below vary by Gradio version - confirm against the deployed Space.
+description = """
+### Sentence Embedding API
+This API provides access to the `all-MiniLM-L6-v2` sentence embedding model.
+**How to use the API:**
+1. Send a POST request to the `/api/generate_embeddings/` endpoint.
+2. The body of the request should be a JSON object with a "data" key.
+3. The value of "data" should be an array containing one element: a list of the texts you want to embed.
+**Example using `curl`:**
+    curl -X POST "https://YOUR-SPACE-NAME.hf.space/api/generate_embeddings/" \\
+    -H "Content-Type: application/json" \\
+    -d '{"data": [["Hello, world!", "This is another sentence."]]}'
+**Expected Success Response (JSON):**
+    {
+      "data": [
+        {
+          "embeddings": [
+            [-0.0139..., 0.0523..., ..., -0.0111...],
+            [0.0229..., -0.0149..., ..., 0.0515...]
+          ]
+        }
+      ],
+      "is_generating": false,
+      "duration": 0.5,
+      "average_duration": 0.5
+    }
+"""
+demo = gr.Interface(
+    fn=generate_embeddings,
+    inputs=gr.JSON(
+        label="Input Texts",
+        info='Provide a list of strings, e.g., ["text 1", "text 2"]'
+    ),
+    outputs=gr.JSON(label="Output Embeddings"),
+    title="Sentence Embedding API Service",
+    description=description,
+    examples=[
+        [[["Hello world", "Gradio is a great tool for building ML apps."]]],
+        [[["What is the capital of France?"]]]
+    ],
+    api_name="generate_embeddings" # This creates the /api/generate_embeddings/ endpoint
+)
+if __name__ == "__main__":
+    demo.launch()