Spaces: Runtime error
Commit 7a990e9 · Parent(s): 98b23d4
Update app.py
app.py CHANGED
@@ -1,11 +1,32 @@
-import pandas as pd, numpy as np
 import os
-from transformers import CLIPProcessor, CLIPTextModel, CLIPModel

+from pathlib import Path
+import pandas as pd, numpy as np
+from transformers import CLIPProcessor, CLIPTextModel, CLIPModel
+import torch
+from torch import nn
 import gradio as gr
 import requests

-
+LABELS = Path('class_names.txt').read_text().splitlines()
+class_model = nn.Sequential(
+    nn.Conv2d(1, 32, 3, padding='same'),
+    nn.ReLU(),
+    nn.MaxPool2d(2),
+    nn.Conv2d(32, 64, 3, padding='same'),
+    nn.ReLU(),
+    nn.MaxPool2d(2),
+    nn.Conv2d(64, 128, 3, padding='same'),
+    nn.ReLU(),
+    nn.MaxPool2d(2),
+    nn.Flatten(),
+    nn.Linear(1152, 256),
+    nn.ReLU(),
+    nn.Linear(256, len(LABELS)),
+)
+state_dict = torch.load('pytorch_model.bin', map_location='cpu')
+class_model.load_state_dict(state_dict, strict=False)
+class_model.eval()


 model = CLIPModel.from_pretrained("openai/clip-vit-base-patch32")
@@ -26,20 +47,27 @@ def download_img(path):
     return local_path

 def predict(query):
+    x = torch.tensor(im, dtype=torch.float32).unsqueeze(0).unsqueeze(0) / 255.
+    with torch.no_grad():
+        out = class_model(x)
+    probabilities = torch.nn.functional.softmax(out[0], dim=0)
+    values, indices = torch.topk(probabilities, 5)
+
+    query = values[0]
+
     n_results=3
     text_embeddings = compute_text_embeddings([query]).detach().numpy()
     results = np.argsort((embeddings@text_embeddings.T)[:, 0])[-1:-n_results-1:-1]
     paths = [download_img(df.iloc[i]['path']) for i in results]
     print(paths)
-    return paths
+    return {LABELS[i]: v.item() for i, v in zip(indices, values)}, paths

 title = "Draw to Search"
 iface = gr.Interface(
     fn=predict,
-    inputs=
-    outputs=[gr.outputs.Image(type="file"), gr.outputs.Image(type="file"), gr.outputs.Image(type="file")],
+    inputs='sketchpad',
+    outputs=[outputs='label', gr.outputs.Image(type="file"), gr.outputs.Image(type="file"), gr.outputs.Image(type="file")],
     title=title,
-    examples=[["Sunset"]]
 )
 iface.launch(debug=True)

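The "Runtime error" status is consistent with problems visible in the new revision: the outputs line (outputs=[outputs='label', ...]) is not valid Python, predict(query) references an undefined variable im even though the sketchpad input is bound to the parameter named query, and query = values[0] passes a probability value rather than a class name to compute_text_embeddings. The sketch below is one plausible repair under those assumptions, not the author's actual fix: classify the sketch, use the top predicted label as the CLIP text query, and return the label confidences alongside three retrieved images. Names such as class_model, LABELS, compute_text_embeddings, embeddings, df, and download_img are taken from the rest of app.py as shown in the diff.

# Hedged sketch of a working predict()/Interface wiring; an assumption about
# the intended behaviour, not the committed fix. Relies on class_model, LABELS,
# compute_text_embeddings, embeddings, df, and download_img from app.py.
import numpy as np
import torch
import gradio as gr

def predict(im):
    # im: 2-D array from the sketchpad input; scale pixel values to [0, 1].
    x = torch.tensor(im, dtype=torch.float32).unsqueeze(0).unsqueeze(0) / 255.
    with torch.no_grad():
        out = class_model(x)
    probabilities = torch.nn.functional.softmax(out[0], dim=0)
    values, indices = torch.topk(probabilities, 5)

    # Use the top predicted class *name*, not its probability, as the text query.
    query = LABELS[indices[0]]
    n_results = 3
    text_embeddings = compute_text_embeddings([query]).detach().numpy()
    results = np.argsort((embeddings @ text_embeddings.T)[:, 0])[-1:-n_results - 1:-1]
    paths = [download_img(df.iloc[i]['path']) for i in results]

    # One return value per output component: a label dict plus three image paths.
    return ({LABELS[i]: v.item() for i, v in zip(indices, values)}, *paths)

iface = gr.Interface(
    fn=predict,
    inputs='sketchpad',
    outputs=['label',
             gr.outputs.Image(type="file"),
             gr.outputs.Image(type="file"),
             gr.outputs.Image(type="file")],
    title="Draw to Search",
)
iface.launch(debug=True)

With this wiring, Gradio (old-style gr.outputs API, as used in the commit) expects exactly one return value per output component, which is why predict returns the label dictionary followed by the three unpacked image paths.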