Commit 3187e25
Parent(s): faf8b3f

pretrained embedding azure blobs

Files changed:
- README.md +10 -0
- app.py +33 -0
- requirements.txt +2 -1
README.md CHANGED
@@ -48,10 +48,20 @@ pip install -r requirements.txt
 
 3. Run the Streamlit app:
 
+To quickly download the pretrained embeddings and skip training:
+
 ```bash
 streamlit run app.py
 ```
 
+Or, to rebuild the embeddings from scratch:
+
+```bash
+streamlit run app.py -- --dev
+```
+
 4. Access the app in your web browser (usually at http://localhost:8501).
 
 ## Technology Stack
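For orientation: in `streamlit run app.py -- --dev`, the bare `--` tells Streamlit to forward everything after it to the script, where it shows up in `sys.argv` and can be read with `argparse` (which is exactly what the `app.py` change below does). A minimal standalone sketch of that pattern follows; it uses `parse_known_args` defensively to ignore undeclared arguments and is an illustration, not code from this commit.

```python
# Sketch only: how a --dev flag passed after "--" reaches the script.
# Run as: streamlit run sketch.py -- --dev   (or: python sketch.py --dev)
import argparse

parser = argparse.ArgumentParser()
parser.add_argument("--dev", action="store_true", help="rebuild embeddings locally")
args, _unknown = parser.parse_known_args()  # ignore anything we did not declare

if args.dev:
    print("dev mode: embeddings will be rebuilt")
else:
    print("production mode: pretrained embeddings will be downloaded")
```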
app.py CHANGED
@@ -10,6 +10,8 @@ from PIL import ImageFile
 from slugify import slugify
 import opendatasets as od
 import json
+import argparse
+
 
 ImageFile.LOAD_TRUNCATED_IMAGES = True
 FOLDER = "images/"
@@ -17,6 +19,32 @@ NUM_TREES = 100
 FEATURES = 1000
 FILETYPES = [".png", ".jpg", ".jpeg", ".tiff", ".bmp"]
 
+from azure.storage.blob import BlobServiceClient
+
+
+@st.cache_resource
+def dl_embeddings():
+    """Download pretrained embeddings in the production environment instead of creating them."""
+    # Connect to the Blob Storage account
+    connect_str = st.secrets["connectionstring"]
+    blob_service_client = BlobServiceClient.from_connection_string(connect_str)
+
+    # Specify container and blob names
+    container_name = "imagessearch"
+    blob_name = f"{slugify(FOLDER)}.tree"
+
+    # Get a reference to the blob
+    blob_client = blob_service_client.get_blob_client(
+        container=container_name, blob=blob_name
+    )
+
+    # Download the binary data
+    download_file_path = f"{slugify(FOLDER)}.tree"  # Path to save the downloaded file
+    with open(download_file_path, "wb") as download_file:
+        download_file.write(blob_client.download_blob().readall())
+
+    print(f"File downloaded to: {download_file_path}")
+
 
 @st.cache_resource
 def load_dataset():
@@ -168,6 +196,11 @@ if __name__ == "__main__":
 
     try:
        load_dataset()
+        # Download the pretrained embeddings when not in the development environment
+        ap = argparse.ArgumentParser()
+        ap.add_argument("--dev", action="store_true")
+        if not ap.parse_args().dev:
+            dl_embeddings()
         save_embedding(FOLDER)
 
         # File uploader
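`dl_embeddings()` only covers the download side; the commit does not show how the `.tree` file gets into the `imagessearch` container in the first place. Assuming the same connection string and naming scheme, a one-off upload from a machine that has already built the embeddings could look roughly like this sketch (not part of the commit; the environment variable is an assumption in place of `st.secrets`):

```python
# Hypothetical upload counterpart to dl_embeddings(); container and blob names
# mirror the ones used in app.py, but this script is not part of the commit.
import os

from azure.storage.blob import BlobServiceClient
from slugify import slugify

FOLDER = "images/"

connect_str = os.environ["AZURE_STORAGE_CONNECTION_STRING"]  # assumed env var
blob_service_client = BlobServiceClient.from_connection_string(connect_str)
blob_client = blob_service_client.get_blob_client(
    container="imagessearch", blob=f"{slugify(FOLDER)}.tree"
)

# Upload the locally built index, replacing any previous version.
with open(f"{slugify(FOLDER)}.tree", "rb") as data:
    blob_client.upload_blob(data, overwrite=True)
print("uploaded", f"{slugify(FOLDER)}.tree")
```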
requirements.txt CHANGED
@@ -4,4 +4,5 @@ torchvision
 streamlit
 tqdm
 python-slugify
-opendatasets
+opendatasets
+azure-storage-blob
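Not shown in this commit, but useful context when reading the diff: the `.tree` extension together with the `NUM_TREES` and `FEATURES` constants in `app.py` suggests the saved embeddings are an Annoy index. If that assumption holds, consuming the downloaded file would look roughly like the following purely illustrative snippet (metric and loading code are guesses, not taken from the repository):

```python
# Assumption: the .tree file is an Annoy index over FEATURES-dimensional vectors.
from annoy import AnnoyIndex
from slugify import slugify

FOLDER = "images/"
FEATURES = 1000

index = AnnoyIndex(FEATURES, "angular")   # metric is a guess
index.load(f"{slugify(FOLDER)}.tree")     # memory-maps the downloaded file
nearest = index.get_nns_by_vector([0.0] * FEATURES, 5)
print("5 nearest item ids:", nearest)
```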