kcz358 committed
Commit d6910a2
Parent: 18b266d

Allow showing auto interp explanations

Files changed (1)
  1. app.py +22 -4
app.py CHANGED
@@ -5,6 +5,9 @@ from sae_auto_interp.features.features import upsample_mask
 import torch
 from transformers import AutoTokenizer
 from PIL import Image
+from datasets import load_dataset
+from tqdm import tqdm
+import pandas as pd
 import spaces
 
 CITATION_BUTTON_TEXT = """
@@ -76,7 +79,7 @@ def generate_activations(image):
         result.scatter_(-1, topk.indices, topk.values)
         cached_list.append(result.detach().cpu())
         topk_indices = (
-            latents.squeeze(0).mean(dim=0).topk(k=100).indices.detach().cpu()
+            latents.squeeze(0).mean(dim=0).topk(k=200).indices.detach().cpu()
         )
 
     handles = [hooked_module.register_forward_hook(hook)]
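For context on the k change above: the hook averages each SAE latent over the image-token positions and keeps the indices of the largest means, now 200 of them instead of 100. A minimal, self-contained sketch of that selection step, with a random tensor standing in for the SAE latents and a deliberately small feature width:

import torch

# Dummy stand-in for the SAE latents produced inside the forward hook:
# (batch=1, image_tokens=576, features). The real feature width is much larger;
# a small width is used here only to keep the example light.
latents = torch.rand(1, 576, 4096)

# Average each feature's activation over the token axis, then keep the k largest.
mean_acts = latents.squeeze(0).mean(dim=0)          # shape: (num_features,)
topk_indices = mean_acts.topk(k=200).indices.cpu()  # feature ids, most active first

print(topk_indices[:10])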
@@ -91,9 +94,14 @@ def generate_activations(image):
     finally:
         for handle in handles:
             handle.remove()
+    examples = []
+    for indice in topk_indices:
+        if indice <= 5000:
+            examples.append([ f"model.layers.24_feature{indice.item()}",explanations[f"model.layers.24_feature{indice.item()}"]])
+
 
     torch.cuda.empty_cache()
-    return topk_indices, cached_list[0]
+    return topk_indices, cached_list[0], examples
 
 def visualize_activations(image, feature_num, cached_tensor):
     base_img_tokens = 576
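The new `examples` block pairs each top-k feature with its auto-interp explanation, and the `indice <= 5000` guard exists because only the first 5k features have entries in the explanations table loaded at startup. A small illustrative sketch of the same lookup pattern, written with `dict.get` so unknown features are simply skipped; the dict contents and index list here are invented for the example:

# Hypothetical stand-ins for the real objects built elsewhere in app.py.
explanations = {
    "model.layers.24_feature3": "activates on dog faces",
    "model.layers.24_feature42": "activates on text in images",
}
topk_indices = [3, 42, 99999]  # pretend output of the top-k step

examples = []
for idx in topk_indices:
    key = f"model.layers.24_feature{idx}"
    explanation = explanations.get(key)  # None if this feature has no explanation
    if explanation is not None:
        examples.append([key, explanation])

print(examples)  # rows for a two-column table: [feature, explanation]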
@@ -208,11 +216,12 @@ with gr.Blocks() as demo:
     with gr.Row():
         with gr.Column():
             image = gr.Image(type="pil", interactive=True, label="Sample Image")
-            topk_features = gr.Textbox(value=topk_indices, placeholder="Top 100 Features", label="Top 100 Features")
+            topk_features = gr.Textbox(value=topk_indices, placeholder="Top 200 Features", label="Top 100 Features", max_lines=5)
+            known_explanation = gr.DataFrame(headers=["Feature", "Auto Interp Explanation"], label="Auto Interp Explanations")
             with gr.Row():
                 clear_btn = gr.ClearButton([image, topk_features], value="Clear")
                 submit_btn = gr.Button("Submit", variant="primary")
-            submit_btn.click(generate_activations, inputs=[image], outputs=[topk_features, cached_tensor])
+            submit_btn.click(generate_activations, inputs=[image], outputs=[topk_features, cached_tensor, known_explanation])
         with gr.Column():
             output = gr.Image(label="Activation Visualization")
             feature_num = gr.Slider(1, 131072, 1, 1, label="Feature Number", interactive=True)
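For the UI wiring: `gr.DataFrame` can be used directly as an event output, with the handler returning a list of rows that match the declared headers. A stripped-down sketch of that pattern, where a dummy handler stands in for `generate_activations` and the component arguments mirror the diff:

import gradio as gr

def fake_generate(_image):
    # Stand-in for generate_activations: return rows for the explanations table.
    return [
        ["model.layers.24_feature3", "activates on dog faces"],
        ["model.layers.24_feature42", "activates on text in images"],
    ]

with gr.Blocks() as demo:
    image = gr.Image(type="pil", label="Sample Image")
    known_explanation = gr.DataFrame(
        headers=["Feature", "Auto Interp Explanation"],
        label="Auto Interp Explanations",
    )
    submit_btn = gr.Button("Submit", variant="primary")
    # The handler's return value fills the DataFrame component.
    submit_btn.click(fake_generate, inputs=[image], outputs=[known_explanation])

if __name__ == "__main__":
    demo.launch()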
@@ -272,5 +281,14 @@ if __name__ == "__main__":
         hf_token=None
     )
     hooked_module = model.language_model.get_submodule("model.layers.24")
+    dataset = load_dataset("lmms-lab/llava-sae-explanations-5k", "legacy", split="test")
+    dataset = dataset.remove_columns(["top1", "top2", "top3", "top4", "top5"])
+    print("Loading Explanation")
+    explanations = {}
+    pbar = tqdm(total=len(dataset), desc="Loading Explanation")
+    for da in dataset:
+        explanations[da["feature"]] = da["explanations"]
+        pbar.update(1)
+    pbar.close()
 
     demo.launch()
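The startup block above flattens the `lmms-lab/llava-sae-explanations-5k` dataset into a `feature -> explanation` dict with a tqdm loop. Since the commit also imports pandas, the same dict could be built via `Dataset.to_pandas`; a hedged alternative sketch, with the column names taken from the diff and everything else assumed:

from datasets import load_dataset

# Load the explanation split used by the demo.
dataset = load_dataset("lmms-lab/llava-sae-explanations-5k", "legacy", split="test")

# Convert to a pandas frame and build the feature -> explanation lookup in one pass.
df = dataset.to_pandas()
explanations = dict(zip(df["feature"], df["explanations"]))

print(len(explanations), "explanations loaded")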
 