ibrim committed on
Commit 1878377 · verified · 1 Parent(s): 3b6db54

Update app.py

Files changed (1): app.py (+92 -18)
app.py CHANGED
@@ -1,3 +1,39 @@
+import os
+import zipfile
+
+# Define the filename
+zip_filename = 'Images.zip'
+
+# Get the current directory path
+current_directory = os.getcwd()
+print(f"Current directory: {current_directory}")
+
+# Append a custom string to the current directory path (for demonstration)
+custom_directory = os.path.join(current_directory, 'UnzippedContent')
+
+# Ensure the custom directory exists
+os.makedirs(custom_directory, exist_ok=True)
+
+# Print the contents of the current directory before unzipping
+print(f"Contents of current directory before unzipping: {os.listdir(current_directory)}")
+
+# Check if the zip file exists in the current directory
+zip_file_path = os.path.join(current_directory, zip_filename)
+if os.path.isfile(zip_file_path):
+    # Open the zip file
+    with zipfile.ZipFile(zip_file_path, 'r') as zip_ref:
+        # Extract all contents of the zip file to the custom directory
+        zip_ref.extractall(custom_directory)
+    print(f"'{zip_filename}' has been successfully unzipped to '{custom_directory}'.")
+
+    # Print the contents of the custom directory after unzipping
+    print(f"Contents of '{custom_directory}': {os.listdir(custom_directory)}")
+else:
+    print(f"'{zip_filename}' not found in the current directory.")
+
+# Print the contents of the current directory after unzipping
+print(f"Contents of current directory after unzipping: {os.listdir(current_directory)}")
+
 import gradio as gr
 import gc
 import cv2
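The extraction block added above condenses into a small reusable helper. A minimal sketch, not part of the commit itself; "unzip_to" is a hypothetical name, while "Images.zip" and "UnzippedContent" are the commit's own values:

import os
import zipfile

def unzip_to(zip_name: str, dest_subdir: str = 'UnzippedContent'):
    """Extract zip_name (resolved against the CWD) into dest_subdir; return its path or None."""
    zip_path = os.path.join(os.getcwd(), zip_name)
    if not os.path.isfile(zip_path):
        print(f"'{zip_name}' not found in the current directory.")
        return None
    dest = os.path.join(os.getcwd(), dest_subdir)
    os.makedirs(dest, exist_ok=True)
    with zipfile.ZipFile(zip_path, 'r') as zip_ref:
        zip_ref.extractall(dest)
    print(f"'{zip_name}' extracted to '{dest}'.")
    return dest

unzip_to('Images.zip')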
@@ -11,30 +47,68 @@ from implement import *
 # from main import build_loaders
 # from CLIP import CLIPModel
 import os
-import zipfile
-
-# Define the filename
-zip_filename = 'Images.zip'
-
-import os
-import zipfile
 
+
+
 with gr.Blocks(css="style.css") as demo:
-    # Define the filename
-    zip_filename = 'Images.zip'
-
-    # Check if the file exists
-    if os.path.isfile(zip_filename):
-        # Open the zip file
-        with zipfile.ZipFile(zip_filename, 'r') as zip_ref:
-            # Extract all contents of the zip file to the current directory
-            zip_ref.extractall()
-        print(f"'{zip_filename}' has been successfully unzipped.")
-    else:
-        print(f"'{zip_filename}' not found in the current directory.")
+    def get_image_embeddings(valid_df, model_path):
+        tokenizer = DistilBertTokenizer.from_pretrained(CFG.text_tokenizer)
+        valid_loader = build_loaders(valid_df, tokenizer, mode="valid")
+
+        model = CLIPModel().to(CFG.device)
+        model.load_state_dict(torch.load(model_path, map_location=CFG.device))
+        model.eval()
+
+        valid_image_embeddings = []
+        with torch.no_grad():
+            for batch in tqdm(valid_loader):
+                image_features = model.image_encoder(batch["image"].to(CFG.device))
+                image_embeddings = model.image_projection(image_features)
+                valid_image_embeddings.append(image_embeddings)
+        return model, torch.cat(valid_image_embeddings)
+
+    _, valid_df = make_train_valid_dfs()
+    model, image_embeddings = get_image_embeddings(valid_df, "best.pt")
+
+    def find_matches(query, n=9):
+        tokenizer = DistilBertTokenizer.from_pretrained(CFG.text_tokenizer)
+        encoded_query = tokenizer([query])
+        batch = {
+            key: torch.tensor(values).to(CFG.device)
+            for key, values in encoded_query.items()
+        }
+        with torch.no_grad():
+            text_features = model.text_encoder(
+                input_ids=batch["input_ids"], attention_mask=batch["attention_mask"]
+            )
+            text_embeddings = model.text_projection(text_features)
+
+        image_embeddings_n = F.normalize(image_embeddings, p=2, dim=-1)
+        text_embeddings_n = F.normalize(text_embeddings, p=2, dim=-1)
+        dot_similarity = text_embeddings_n @ image_embeddings_n.T
+
+        # Each image appears once per caption, so take the n * 5 best hits and keep every 5th.
+        _, indices = torch.topk(dot_similarity.squeeze(0), n * 5)
+        matches = [valid_df['image'].values[idx] for idx in indices[::5]]
+
+        images = []
+        for match in matches:
+            image = cv2.imread(f"{CFG.image_path}/{match}")
+            image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+            images.append(image)
+
+        # The output component below is a single image, so return the top match.
+        return images[0]
+
+    with gr.Row():
+        textbox = gr.Textbox(label="Enter a query to find matching images using a CLIP model.")
+        image = gr.Image(type="numpy")
+
+    button = gr.Button("Press")
+    button.click(
+        fn=find_matches,
+        inputs=textbox,
+        outputs=image
+    )
 
 # Create Gradio interface
 demo.launch(share=True)
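The retrieval step in find_matches is plain cosine similarity over L2-normalized embeddings. A self-contained sketch with dummy tensors; the shapes (50 embeddings of width 256, i.e. 10 images x 5 captions each) are illustrative assumptions, not values from the commit:

import torch
import torch.nn.functional as F

# Dummy stand-ins for the precomputed image embeddings and one encoded query.
image_embeddings = torch.randn(50, 256)
text_embeddings = torch.randn(1, 256)

# L2-normalize so the dot product equals cosine similarity.
image_n = F.normalize(image_embeddings, p=2, dim=-1)
text_n = F.normalize(text_embeddings, p=2, dim=-1)
dot_similarity = text_n @ image_n.T          # shape (1, 50)

# Take the n * 5 best rows, then every 5th, mirroring the dedupe in find_matches.
n = 9
_, indices = torch.topk(dot_similarity.squeeze(0), n * 5)
unique_indices = indices[::5]                # 9 candidate image indices
print(unique_indices.tolist())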
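find_matches computes n matches but the interface shows only the first, so a gr.Gallery output is one way to surface all of them. A hypothetical variant of the commit's UI block, assuming find_matches were changed to return the whole images list:

import gradio as gr

# Variant, not in the commit: find_matches here is the function defined in
# app.py, modified to `return images` (a list of RGB arrays) instead of images[0].
with gr.Blocks(css="style.css") as demo:
    textbox = gr.Textbox(label="Enter a query to find matching images using a CLIP model.")
    gallery = gr.Gallery(label="Matches")
    gr.Button("Press").click(fn=find_matches, inputs=textbox, outputs=gallery)

demo.launch(share=True)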