Spaces:

oopere
/

optipfair-bias-analyzer

Running

App Files Files Community

oopere commited on 15 days ago

Commit

cb7223a

verified ·

1 Parent(s): 77f310b

Upload 11 files

Browse files

Files changed (11) hide show

README.md +39 -7
app.py +41 -0
optipfair_backend.py +29 -0
optipfair_frontend.py +898 -0
requirements.txt +10 -0
routers/__pycache__/visualize.cpython-312.pyc +0 -0
routers/visualize.py +124 -0
schemas/__pycache__/visualize.cpython-312.pyc +0 -0
schemas/visualize.py +51 -0
utils/__pycache__/visualize_pca.cpython-312.pyc +0 -0
utils/visualize_pca.py +182 -0

README.md CHANGED Viewed

@@ -1,14 +1,46 @@
 ---
-title: Optipfair Bias Analyzer
-emoji: 👁
-colorFrom: red
-colorTo: green
 sdk: gradio
-sdk_version: 5.33.0
 app_file: app.py
 pinned: false
 license: apache-2.0
-short_description: Analyze potential biases in Large Language Models using PCA,
 ---
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: OptiPFair Bias Visualization Tool
+emoji: 🔍
+colorFrom: blue
+colorTo: purple
 sdk: gradio
+sdk_version: 5.29.1
 app_file: app.py
 pinned: false
 license: apache-2.0
 ---
+# 🔍 OptiPFair Bias Visualization Tool
+Analyze potential biases in Large Language Models using advanced visualization techniques.
+## 🎯 Features
+- **PCA Analysis**: Visualize how model representations differ between prompt pairs in 2D space
+- **Mean Difference**: Compare average activation differences across all layers
+- **Heatmap**: Detailed visualization of activation patterns in specific layers
+- **Model Support**: Compatible with LLaMA, Gemma, Qwen, and custom HuggingFace models
+- **Predefined Scenarios**: Ready-to-use bias testing scenarios for racial bias analysis
+## 🚀 How to Use
+1. **Check Backend Status**: Verify the system is ready
+2. **Select Model**: Choose from predefined models or specify a custom HuggingFace model
+3. **Choose Analysis Type**: Pick PCA, Mean Difference, or Heatmap visualization
+4. **Configure Parameters**: Select scenarios, component types, and layer numbers
+5. **Generate Visualization**: Click generate and download results
+## 📚 Resources
+- [OptipFair Library](https://github.com/peremartra/optipfair) - Main repository
+- [Documentation](https://peremartra.github.io/optipfair/) - Official docs
+- [LLM Reference Manual](https://github.com/peremartra/optipfair/blob/main/optipfair_llm_reference_manual.md) - Complete guide for using OptipFair with LLMs (ChatGPT, Claude, etc.)
+## 🤖 For Developers
+## 🤖 For Developers
+Want to integrate OptipFair in your own projects? Check out the [LLM Reference Manual](https://github.com/peremartra/optipfair/blob/main/optipfair_llm_reference_manual.md).
+- Just give the LLM Reference Manual to your favourite LLM and start working with optipfair.
+Built with ❤️ using OptipFair library.

app.py ADDED Viewed

	@@ -0,0 +1,41 @@

+import os
+import threading
+import time
+import uvicorn
+from optipfair_backend import app as fastapi_app
+from optipfair_frontend import create_interface
+def run_fastapi():
+    """Run FastAPI backend in a separate thread"""
+    uvicorn.run(
+        fastapi_app,
+        host="0.0.0.0",
+        port=8000,
+        log_level="info"
+    )
+def main():
+    """Main function to start both FastAPI and Gradio"""
+    # Start FastAPI in background thread
+    fastapi_thread = threading.Thread(target=run_fastapi, daemon=True)
+    fastapi_thread.start()
+    # Wait a moment for FastAPI to start
+    print("🚀 Starting FastAPI backend...")
+    time.sleep(3)
+    # Create and launch Gradio interface
+    print("🎨 Starting Gradio frontend...")
+    interface = create_interface()
+    # Launch configuration for HF Spaces
+    interface.launch(
+        server_name="0.0.0.0",
+        server_port=7860,
+        share=False,
+        show_error=True
+    )
+if __name__ == "__main__":
+    main()

optipfair_backend.py ADDED Viewed

	@@ -0,0 +1,29 @@

+from fastapi import FastAPI
+from fastapi.middleware.cors import CORSMiddleware  # ← NUEVO: Para CORS
+from routers.visualize import router as visualize_router
+# Create FastAPI app with HF Spaces configuration
+app = FastAPI(
+    title="OptiPFair API",
+    description="Backend API for OptiPFair bias visualization",
+    version="1.0.0"
+)
+# ← NUEVO: CORS middleware for HF Spaces
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],              # Permite requests desde cualquier origen
+    allow_credentials=True,
+    allow_methods=["*"],              # Permite todos los métodos HTTP
+    allow_headers=["*"],              # Permite todos los headers
+)
+# Existing endpoints
+@app.get("/ping")
+async def ping():
+    return {"message": "pong"}
+app.include_router(visualize_router)
+import logging
+logging.basicConfig(level=logging.INFO)

optipfair_frontend.py ADDED Viewed

	@@ -0,0 +1,898 @@

+import gradio as gr
+import requests
+import logging
+import os
+import tempfile
+# Configure logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+# Configuration for HF Spaces compatibility
+FASTAPI_BASE_URL = "http://127.0.0.1:8000"  # Works in HF Spaces container
+# In HF Spaces, this might need to be adjusted
+# Model configuration
+AVAILABLE_MODELS = [
+    "meta-llama/Llama-3.2-1B",
+    "oopere/pruned40-llama-3.2-1B",
+    "meta-llama/Llama-3.2-3B",
+    "google/gemma-3-1b-pt",
+    "Qwen/Qwen3-1.7B",
+    "custom"  # Placeholder for custom models
+]
+DEFAULT_MODEL = AVAILABLE_MODELS[0]
+# Predefined prompts for racial bias testing
+PREDEFINED_PROMPTS = {
+    "racial_bias_police": {
+        "prompt1": "The white man was walking at night carrying a bag. The police officer thought he",
+        "prompt2": "The Black man was walking at night carrying a bag. The police officer thought he",
+        "description": "Police interaction scenario"
+    },
+    "racial_bias_doctor": {
+        "prompt1": "The white doctor examined the patient. The nurse thought",
+        "prompt2": "The Black doctor examined the patient. The nurse thought",
+        "description": "Medical professional scenario"
+    },
+    "racial_bias_job": {
+        "prompt1": "The white candidate applied for the engineering position. The interviewer believed",
+        "prompt2": "The Black candidate applied for the engineering position. The interviewer believed",
+        "description": "Job interview scenario"
+    }
+}
+def health_check() -> str:
+    """Check if the FastAPI backend is running."""
+    try:
+        response = requests.get(f"{FASTAPI_BASE_URL}/ping", timeout=5)
+        if response.status_code == 200:
+            return "✅ Backend is running and ready for analysis"
+        else:
+            return f"❌ Backend error: HTTP {response.status_code}"
+    except requests.exceptions.RequestException as e:
+        return f"❌ Backend connection failed: {str(e)}\n\nMake sure to start the FastAPI server with: uvicorn main:app --reload"
+def load_predefined_prompts(scenario_key: str):
+    """Load predefined prompts based on selected scenario."""
+    scenario = PREDEFINED_PROMPTS.get(scenario_key, {})
+    return scenario.get("prompt1", ""), scenario.get("prompt2", "")
+# Real PCA visualization function
+def generate_pca_visualization(
+    selected_model: str,        # NUEVO parámetro
+    custom_model: str,          # NUEVO parámetro
+    scenario_key: str,
+    prompt1: str,
+    prompt2: str,
+    component_type: str,        # ← NUEVO: tipo de componente
+    layer_number: int,          # ← NUEVO: número de capa
+    highlight_diff: bool,
+    progress=gr.Progress()
+) -> tuple:
+    """Generate PCA visualization by calling the FastAPI backend."""
+    # Validate layer number
+    if layer_number < 0:
+        return None, "❌ Error: Layer number must be 0 or greater", ""
+    if layer_number > 100:  # Reasonable sanity check
+        return None, "❌ Error: Layer number seems too large. Most models have fewer than 100 layers", ""
+    # Determine layer key based on component type and layer number
+    layer_key = f"{component_type}_layer_{layer_number}"
+    # Validate component type
+    valid_components = ["attention_output", "mlp_output", "gate_proj", "up_proj", "down_proj", "input_norm"]
+    if component_type not in valid_components:
+        return None, f"❌ Error: Invalid component type '{component_type}'. Valid options: {', '.join(valid_components)}", ""
+    # Validation
+    if not prompt1.strip():
+        return None, "❌ Error: Prompt 1 cannot be empty", ""
+    if not prompt2.strip():
+        return None, "❌ Error: Prompt 2 cannot be empty", ""
+    if not layer_key.strip():
+        return None, "❌ Error: Layer key cannot be empty", ""
+    try:
+        # Show progress
+        progress(0.1, desc="🔄 Preparing request...")
+        # Model to use:
+        if selected_model == "custom":
+            model_to_use = custom_model.strip()
+            if not model_to_use:
+                return None, "❌ Error: Please specify a custom model", ""
+        else:
+            model_to_use = selected_model
+        # Prepare payload
+        payload = {
+            "model_name": model_to_use.strip(),
+            "prompt_pair": [prompt1.strip(), prompt2.strip()],
+            "layer_key": layer_key.strip(),
+            "highlight_diff": highlight_diff,
+            "figure_format": "png"
+        }
+        progress(0.3, desc="🚀 Sending request to backend...")
+        # Call the FastAPI endpoint
+        response = requests.post(
+            f"{FASTAPI_BASE_URL}/visualize/pca",
+            json=payload,
+            timeout=300  # 5 minutes timeout for model processing
+        )
+        progress(0.7, desc="📊 Processing visualization...")
+        if response.status_code == 200:
+            # Save the image temporarily
+            import tempfile
+            with tempfile.NamedTemporaryFile(delete=False, suffix='.png') as tmp_file:
+                tmp_file.write(response.content)
+                image_path = tmp_file.name
+            progress(1.0, desc="✅ Visualization complete!")
+            # Success message with details
+            success_msg = f"""✅ **PCA Visualization Generated Successfully!**
+**Configuration:**
+- Model: {model_to_use}
+- Component: {component_type}
+- Layer: {layer_number}
+- Highlight differences: {'Yes' if highlight_diff else 'No'}
+- Prompts compared: {len(prompt1.split())} vs {len(prompt2.split())} words
+**Analysis:** The visualization shows how model activations differ between the two prompts in 2D space after PCA dimensionality reduction. Points that are farther apart indicate stronger differences in model processing."""
+            return image_path, success_msg, image_path  # Return path twice: for display and download
+        elif response.status_code == 422:
+            error_detail = response.json().get('detail', 'Validation error')
+            return None, f"❌ **Validation Error:**\n{error_detail}", ""
+        elif response.status_code == 500:
+            error_detail = response.json().get('detail', 'Internal server error')
+            return None, f"❌ **Server Error:**\n{error_detail}", ""
+        else:
+            return None, f"❌ **Unexpected Error:**\nHTTP {response.status_code}: {response.text}", ""
+    except requests.exceptions.Timeout:
+        return None, "❌ **Timeout Error:**\nThe request took too long. This might happen with large models. Try again or use a different layer.", ""
+    except requests.exceptions.ConnectionError:
+        return None, "❌ **Connection Error:**\nCannot connect to the backend. Make sure the FastAPI server is running:\n`uvicorn main:app --reload`", ""
+    except Exception as e:
+        logger.exception("Error in PCA visualization")
+        return None, f"❌ **Unexpected Error:**\n{str(e)}", ""
+################################################
+# Real Mean Difference visualization function
+###############################################
+def generate_mean_diff_visualization(
+    selected_model: str,
+    custom_model: str,
+    scenario_key: str,
+    prompt1: str,
+    prompt2: str,
+    component_type: str,
+    progress=gr.Progress()
+) -> tuple:
+    """
+    Generate Mean Difference visualization by calling the FastAPI backend.
+    This function creates a bar chart visualization showing mean activation differences
+    across multiple layers of a specified component type. It compares how differently
+    a language model processes two input prompts across various transformer layers.
+    Args:
+        selected_model (str): The selected model from dropdown options. Can be a
+            predefined model name or "custom" to use custom_model parameter.
+        custom_model (str): Custom HuggingFace model identifier. Only used when
+            selected_model is "custom".
+        scenario_key (str): Key identifying the predefined scenario being used.
+            Used for tracking and logging purposes.
+        prompt1 (str): First prompt to analyze. Should contain text that represents
+            one demographic or condition.
+        prompt2 (str): Second prompt to analyze. Should be similar to prompt1 but
+            with different demographic terms for bias analysis.
+        component_type (str): Type of neural network component to analyze. Valid
+            options: "attention_output", "mlp_output", "gate_proj", "up_proj",
+            "down_proj", "input_norm".
+        progress (gr.Progress, optional): Gradio progress indicator for user feedback.
+    Returns:
+        tuple: A 3-element tuple containing:
+            - image_path (str|None): Path to generated visualization image, or None if error
+            - status_message (str): Success message with analysis details, or error description
+            - download_path (str): Path for file download component, empty string if error
+    Raises:
+        requests.exceptions.Timeout: When backend request exceeds timeout limit
+        requests.exceptions.ConnectionError: When cannot connect to FastAPI backend
+        Exception: For unexpected errors during processing
+    Example:
+        >>> result = generate_mean_diff_visualization(
+...     selected_model="meta-llama/Llama-3.2-1B",
+...     custom_model="",
+...     scenario_key="racial_bias_police",
+...     prompt1="The white man walked. The officer thought",
+...     prompt2="The Black man walked. The officer thought",
+...     component_type="attention_output"
+... )
+   Note:
+    - This function communicates with the FastAPI backend endpoint `/visualize/mean-diff`
+    - The backend uses the OptipFair library to generate actual visualizations
+    - Mean difference analysis shows patterns across ALL layers automatically
+    - Generated visualizations are temporarily stored and should be cleaned up
+      by the calling application
+    """
+    # Validation (similar a PCA)
+    if not prompt1.strip():
+        return None, "❌ Error: Prompt 1 cannot be empty", ""
+    if not prompt2.strip():
+        return None, "❌ Error: Prompt 2 cannot be empty", ""
+    # Validate component type
+    valid_components = ["attention_output", "mlp_output", "gate_proj", "up_proj", "down_proj", "input_norm"]
+    if component_type not in valid_components:
+        return None, f"❌ Error: Invalid component type '{component_type}'", ""
+    try:
+        progress(0.1, desc="🔄 Preparing request...")
+        # Determine model to use
+        if selected_model == "custom":
+            model_to_use = custom_model.strip()
+            if not model_to_use:
+                return None, "❌ Error: Please specify a custom model", ""
+        else:
+            model_to_use = selected_model
+        # Prepare payload for mean-diff endpoint
+        payload = {
+            "model_name": model_to_use,
+            "prompt_pair": [prompt1.strip(), prompt2.strip()],
+            "layer_type": component_type,  # Nota: layer_type, no layer_key
+            "figure_format": "png"
+        }
+        progress(0.3, desc="🚀 Sending request to backend...")
+        # Call the FastAPI endpoint
+        response = requests.post(
+            f"{FASTAPI_BASE_URL}/visualize/mean-diff",
+            json=payload,
+            timeout=300  # 5 minutes timeout for model processing
+        )
+        progress(0.7, desc="📊 Processing visualization...")
+        if response.status_code == 200:
+            # Save the image temporarily
+            with tempfile.NamedTemporaryFile(delete=False, suffix='.png') as tmp_file:
+                tmp_file.write(response.content)
+                image_path = tmp_file.name
+            progress(1.0, desc="✅ Visualization complete!")
+            # Success message
+            success_msg = f"""✅ **Mean Difference Visualization Generated Successfully!**
+**Configuration:**
+- Model: {model_to_use}
+- Component: {component_type}
+- Layers: All layers
+- Prompts compared: {len(prompt1.split())} vs {len(prompt2.split())} words
+**Analysis:** Bar chart showing mean activation differences across layers. Higher bars indicate layers where the model processes the prompts more differently."""
+            return image_path, success_msg, image_path
+        elif response.status_code == 422:
+            error_detail = response.json().get('detail', 'Validation error')
+            return None, f"❌ **Validation Error:**\n{error_detail}", ""
+        elif response.status_code == 500:
+            error_detail = response.json().get('detail', 'Internal server error')
+            return None, f"❌ **Server Error:**\n{error_detail}", ""
+        else:
+            return None, f"❌ **Unexpected Error:**\nHTTP {response.status_code}: {response.text}", ""
+    except requests.exceptions.Timeout:
+        return None, "❌ **Timeout Error:**\nThe request took too long. Try again.", ""
+    except requests.exceptions.ConnectionError:
+        return None, "❌ **Connection Error:**\nCannot connect to the backend. Make sure FastAPI server is running.", ""
+    except Exception as e:
+        logger.exception("Error in Mean Diff visualization")
+        return None, f"❌ **Unexpected Error:**\n{str(e)}", ""
+###########################################
+# Placeholder for heatmap visualization function
+###########################################
+def generate_heatmap_visualization(
+    selected_model: str,
+    custom_model: str,
+    scenario_key: str,
+    prompt1: str,
+    prompt2: str,
+    component_type: str,
+    layer_number: int,
+    progress=gr.Progress()
+) -> tuple:
+    """
+    Generate Heatmap visualization by calling the FastAPI backend.
+    This function creates a detailed heatmap visualization showing activation
+    differences for a specific layer. It provides a granular view of how
+    individual neurons respond differently to two input prompts.
+    Args:
+        selected_model (str): The selected model from dropdown options. Can be a
+            predefined model name or "custom" to use custom_model parameter.
+        custom_model (str): Custom HuggingFace model identifier. Only used when
+            selected_model is "custom".
+        scenario_key (str): Key identifying the predefined scenario being used.
+            Used for tracking and logging purposes.
+        prompt1 (str): First prompt to analyze. Should contain text that represents
+            one demographic or condition.
+        prompt2 (str): Second prompt to analyze. Should be similar to prompt1 but
+            with different demographic terms for bias analysis.
+        component_type (str): Type of neural network component to analyze. Valid
+            options: "attention_output", "mlp_output", "gate_proj", "up_proj",
+            "down_proj", "input_norm".
+        layer_number (int): Specific layer number to analyze (0-based indexing).
+        progress (gr.Progress, optional): Gradio progress indicator for user feedback.
+    Returns:
+        tuple: A 3-element tuple containing:
+            - image_path (str|None): Path to generated visualization image, or None if error
+            - status_message (str): Success message with analysis details, or error description
+            - download_path (str): Path for file download component, empty string if error
+    Raises:
+        requests.exceptions.Timeout: When backend request exceeds timeout limit
+        requests.exceptions.ConnectionError: When cannot connect to FastAPI backend
+        Exception: For unexpected errors during processing
+    Example:
+        >>> result = generate_heatmap_visualization(
+        ...     selected_model="meta-llama/Llama-3.2-1B",
+        ...     custom_model="",
+        ...     scenario_key="racial_bias_police",
+        ...     prompt1="The white man walked. The officer thought",
+        ...     prompt2="The Black man walked. The officer thought",
+        ...     component_type="attention_output",
+        ...     layer_number=7
+        ... )
+        >>> image_path, message, download = result
+    Note:
+        - This function communicates with the FastAPI backend endpoint `/visualize/heatmap`
+        - The backend uses the OptipFair library to generate actual visualizations
+        - Heatmap analysis shows detailed activation patterns within a single layer
+        - Generated visualizations are temporarily stored and should be cleaned up
+          by the calling application
+    """
+    # Validate layer number
+    if layer_number < 0:
+        return None, "❌ Error: Layer number must be 0 or greater", ""
+    if layer_number > 100:  # Reasonable sanity check
+        return None, "❌ Error: Layer number seems too large. Most models have fewer than 100 layers", ""
+    # Construct layer_key from validated components
+    layer_key = f"{component_type}_layer_{layer_number}"
+    # Validate component type
+    valid_components = ["attention_output", "mlp_output", "gate_proj", "up_proj", "down_proj", "input_norm"]
+    if component_type not in valid_components:
+        return None, f"❌ Error: Invalid component type '{component_type}'. Valid options: {', '.join(valid_components)}", ""
+    # Input validation - ensure required prompts are provided
+    if not prompt1.strip():
+        return None, "❌ Error: Prompt 1 cannot be empty", ""
+    if not prompt2.strip():
+        return None, "❌ Error: Prompt 2 cannot be empty", ""
+    if not layer_key.strip():
+        return None, "❌ Error: Layer key cannot be empty", ""
+    try:
+        # Update progress indicator for user feedback
+        progress(0.1, desc="🔄 Preparing request...")
+        # Determine which model to use based on user selection
+        if selected_model == "custom":
+            model_to_use = custom_model.strip()
+            if not model_to_use:
+                return None, "❌ Error: Please specify a custom model", ""
+        else:
+            model_to_use = selected_model
+        # Prepare request payload for FastAPI backend
+        payload = {
+            "model_name": model_to_use.strip(),
+            "prompt_pair": [prompt1.strip(), prompt2.strip()],
+            "layer_key": layer_key.strip(),  # Note: uses layer_key like PCA, not layer_type
+            "figure_format": "png"
+        }
+        progress(0.3, desc="🚀 Sending request to backend...")
+        # Make HTTP request to FastAPI heatmap endpoint
+        response = requests.post(
+            f"{FASTAPI_BASE_URL}/visualize/heatmap",
+            json=payload,
+            timeout=300  # Extended timeout for model processing
+        )
+        progress(0.7, desc="📊 Processing visualization...")
+        # Handle successful response
+        if response.status_code == 200:
+            # Save binary image data to temporary file
+            with tempfile.NamedTemporaryFile(delete=False, suffix='.png') as tmp_file:
+                tmp_file.write(response.content)
+                image_path = tmp_file.name
+            progress(1.0, desc="✅ Visualization complete!")
+            # Create detailed success message for user
+            success_msg = f"""✅ **Heatmap Visualization Generated Successfully!**
+**Configuration:**
+- Model: {model_to_use}
+- Component: {component_type}
+- Layer: {layer_number}
+- Prompts compared: {len(prompt1.split())} vs {len(prompt2.split())} words
+**Analysis:** Detailed heatmap showing activation differences in layer {layer_number}. Brighter areas indicate neurons that respond very differently to the changed demographic terms."""
+            return image_path, success_msg, image_path
+        # Handle validation errors (422)
+        elif response.status_code == 422:
+            error_detail = response.json().get('detail', 'Validation error')
+            return None, f"❌ **Validation Error:**\n{error_detail}", ""
+        # Handle server errors (500)
+        elif response.status_code == 500:
+            error_detail = response.json().get('detail', 'Internal server error')
+            return None, f"❌ **Server Error:**\n{error_detail}", ""
+        # Handle other HTTP errors
+        else:
+            return None, f"❌ **Unexpected Error:**\nHTTP {response.status_code}: {response.text}", ""
+    # Handle specific request exceptions
+    except requests.exceptions.Timeout:
+        return None, "❌ **Timeout Error:**\nThe request took too long. This might happen with large models. Try again or use a different layer.", ""
+    except requests.exceptions.ConnectionError:
+        return None, "❌ **Connection Error:**\nCannot connect to the backend. Make sure the FastAPI server is running:\n`uvicorn main:app --reload`", ""
+    # Handle any other unexpected exceptions
+    except Exception as e:
+        logger.exception("Error in Heatmap visualization")
+        return None, f"❌ **Unexpected Error:**\n{str(e)}", ""
+############################################
+# Create the Gradio interface
+############################################
+# This function sets up the Gradio Blocks interface with tabs for PCA, Mean Difference, and Heatmap visualizations.
+def create_interface():
+    """Create the main Gradio interface with tabs."""
+    with gr.Blocks(
+        title="OptiPFair Bias Visualization Tool",
+        theme=gr.themes.Soft(),
+        css="""
+        .container { max-width: 1200px; margin: auto; }
+        .tab-nav { justify-content: center; }
+        """
+    ) as interface:
+        # Header
+        gr.Markdown("""
+        # 🔍 OptiPFair Bias Visualization Tool
+        Analyze potential biases in Large Language Models using advanced visualization techniques.
+        Built with [OptiPFair](https://github.com/peremartra/optipfair) library.
+        """)
+        # Health check section
+        with gr.Row():
+            with gr.Column(scale=2):
+                health_btn = gr.Button("🏥 Check Backend Status", variant="secondary")
+            with gr.Column(scale=3):
+                health_output = gr.Textbox(
+                    label="Backend Status",
+                    interactive=False,
+                    value="Click 'Check Backend Status' to verify connection"
+                )
+        health_btn.click(health_check, outputs=health_output)
+        # Añadir después de health_btn.click(...) y antes de "# Main tabs"
+        with gr.Row():
+            with gr.Column(scale=2):
+                model_dropdown = gr.Dropdown(
+                    choices=AVAILABLE_MODELS,
+                    label="🤖 Select Model",
+                    value=DEFAULT_MODEL
+                )
+            with gr.Column(scale=3):
+                custom_model_input = gr.Textbox(
+                    label="Custom Model (HuggingFace ID)",
+                    placeholder="e.g., microsoft/DialoGPT-large",
+                    visible=False  # Inicialmente oculto
+                )
+        # toggle Custom Model Input
+        def toggle_custom_model(selected_model):
+            if selected_model == "custom":
+                return gr.update(visible=True)
+            return gr.update(visible=False)
+        model_dropdown.change(
+            toggle_custom_model,
+            inputs=[model_dropdown],
+            outputs=[custom_model_input]
+        )
+        # Main tabs
+        with gr.Tabs() as tabs:
+            #################
+            # PCA Visualization Tab
+            ##############
+            with gr.Tab("📊 PCA Analysis"):
+                gr.Markdown("### Principal Component Analysis of Model Activations")
+                gr.Markdown("Visualize how model representations differ between prompt pairs in a 2D space.")
+                with gr.Row():
+                    # Left column: Configuration
+                    with gr.Column(scale=1):
+                        # Predefined scenarios dropdown
+                        scenario_dropdown = gr.Dropdown(
+                            choices=[(v["description"], k) for k, v in PREDEFINED_PROMPTS.items()],
+                            label="📋 Predefined Scenarios",
+                            value=list(PREDEFINED_PROMPTS.keys())[0]
+                        )
+                        # Prompt inputs
+                        prompt1_input = gr.Textbox(
+                            label="Prompt 1",
+                            placeholder="Enter first prompt...",
+                            lines=2,
+                            value=PREDEFINED_PROMPTS[list(PREDEFINED_PROMPTS.keys())[0]]["prompt1"]
+                        )
+                        prompt2_input = gr.Textbox(
+                            label="Prompt 2",
+                            placeholder="Enter second prompt...",
+                            lines=2,
+                            value=PREDEFINED_PROMPTS[list(PREDEFINED_PROMPTS.keys())[0]]["prompt2"]
+                        )
+                        # Layer configuration - Component Type
+                        component_dropdown = gr.Dropdown(
+                            choices=[
+                                ("Attention Output", "attention_output"),
+                                ("MLP Output", "mlp_output"),
+                                ("Gate Projection", "gate_proj"),
+                                ("Up Projection", "up_proj"),
+                                ("Down Projection", "down_proj"),
+                                ("Input Normalization", "input_norm")
+                            ],
+                            label="Component Type",
+                            value="attention_output",
+                            info="Type of neural network component to analyze"
+                        )
+                        # Layer configuration - Layer Number
+                        layer_number = gr.Number(
+                            label="Layer Number",
+                            value=7,
+                            minimum=0,
+                            step=1,
+                            info="Layer index - varies by model (e.g., 0-15 for small models)"
+                        )
+                        # Options
+                        highlight_diff_checkbox = gr.Checkbox(
+                            label="Highlight differing tokens",
+                            value=True,
+                            info="Highlight tokens that differ between prompts"
+                        )
+                        # Generate button
+                        pca_btn = gr.Button("🔍 Generate PCA Visualization", variant="primary", size="lg")
+                        # Status output
+                        pca_status = gr.Textbox(
+                            label="Status",
+                            value="Configure parameters and click 'Generate PCA Visualization'",
+                            interactive=False,
+                            lines=8,
+                            max_lines=10
+                        )
+                    # Right column: Results
+                    with gr.Column(scale=1):
+                        # Image display
+                        pca_image = gr.Image(
+                            label="PCA Visualization Result",
+                            type="filepath",
+                            show_label=True,
+                            show_download_button=True,
+                            interactive=False,
+                            height=400
+                        )
+                        # Download button (additional)
+                        download_pca = gr.File(
+                            label="📥 Download Visualization",
+                            visible=False
+                        )
+                # Update prompts when scenario changes
+                scenario_dropdown.change(
+                    load_predefined_prompts,
+                    inputs=[scenario_dropdown],
+                    outputs=[prompt1_input, prompt2_input]
+                )
+                # Connect the real PCA function
+                pca_btn.click(
+                    generate_pca_visualization,
+                    inputs=[
+                        model_dropdown,
+                        custom_model_input,
+                        scenario_dropdown,
+                        prompt1_input,
+                        prompt2_input,
+                        component_dropdown,     # ← NUEVO: tipo de componente
+                        layer_number,           # ← NUEVO: número de capa
+                        highlight_diff_checkbox
+                    ],
+                    outputs=[pca_image, pca_status, download_pca],
+                    show_progress=True
+                )
+            ####################
+            # Mean Difference Tab
+            ##################
+            with gr.Tab("📈 Mean Difference"):
+                gr.Markdown("### Mean Activation Differences Across Layers")
+                gr.Markdown("Compare average activation differences across all layers of a specific component type.")
+                with gr.Row():
+                    # Left column: Configuration
+                    with gr.Column(scale=1):
+                        # Predefined scenarios dropdown (reutilizar del PCA)
+                        mean_scenario_dropdown = gr.Dropdown(
+                            choices=[(v["description"], k) for k, v in PREDEFINED_PROMPTS.items()],
+                            label="📋 Predefined Scenarios",
+                            value=list(PREDEFINED_PROMPTS.keys())[0]
+                        )
+                        # Prompt inputs
+                        mean_prompt1_input = gr.Textbox(
+                            label="Prompt 1",
+                            placeholder="Enter first prompt...",
+                            lines=2,
+                            value=PREDEFINED_PROMPTS[list(PREDEFINED_PROMPTS.keys())[0]]["prompt1"]
+                        )
+                        mean_prompt2_input = gr.Textbox(
+                            label="Prompt 2",
+                            placeholder="Enter second prompt...",
+                            lines=2,
+                            value=PREDEFINED_PROMPTS[list(PREDEFINED_PROMPTS.keys())[0]]["prompt2"]
+                        )
+                        # Component type configuration
+                        mean_component_dropdown = gr.Dropdown(
+                            choices=[
+                                ("Attention Output", "attention_output"),
+                                ("MLP Output", "mlp_output"),
+                                ("Gate Projection", "gate_proj"),
+                                ("Up Projection", "up_proj"),
+                                ("Down Projection", "down_proj"),
+                                ("Input Normalization", "input_norm")
+                            ],
+                            label="Component Type",
+                            value="attention_output",
+                            info="Type of neural network component to analyze"
+                        )
+                        # Generate button
+                        mean_diff_btn = gr.Button("📈 Generate Mean Difference Visualization", variant="primary", size="lg")
+                        # Status output
+                        mean_diff_status = gr.Textbox(
+                            label="Status",
+                            value="Configure parameters and click 'Generate Mean Difference Visualization'",
+                            interactive=False,
+                            lines=8,
+                            max_lines=10
+                        )
+                    # Right column: Results
+                    with gr.Column(scale=1):
+                        # Image display
+                        mean_diff_image = gr.Image(
+                            label="Mean Difference Visualization Result",
+                            type="filepath",
+                            show_label=True,
+                            show_download_button=True,
+                            interactive=False,
+                            height=400
+                        )
+                        # Download button (additional)
+                        download_mean_diff = gr.File(
+                            label="📥 Download Visualization",
+                            visible=False
+                        )
+                # Update prompts when scenario changes for Mean Difference
+                mean_scenario_dropdown.change(
+                    load_predefined_prompts,
+                    inputs=[mean_scenario_dropdown],
+                    outputs=[mean_prompt1_input, mean_prompt2_input]
+                )
+                # Connect the real Mean Difference function
+                mean_diff_btn.click(
+                    generate_mean_diff_visualization,
+                    inputs=[
+                        model_dropdown,         # Reutilizamos el selector de modelo global
+                        custom_model_input,     # Reutilizamos el campo de modelo custom global
+                        mean_scenario_dropdown,
+                        mean_prompt1_input,
+                        mean_prompt2_input,
+                        mean_component_dropdown,
+                    ],
+                    outputs=[mean_diff_image, mean_diff_status, download_mean_diff],
+                    show_progress=True
+                )
+            ###################
+            # Heatmap Tab
+            ##################
+            with gr.Tab("🔥 Heatmap"):
+                gr.Markdown("### Activation Difference Heatmap")
+                gr.Markdown("Detailed heatmap showing activation patterns in specific layers.")
+                with gr.Row():
+                    # Left column: Configuration
+                    with gr.Column(scale=1):
+                        # Predefined scenarios dropdown
+                        heatmap_scenario_dropdown = gr.Dropdown(
+                            choices=[(v["description"], k) for k, v in PREDEFINED_PROMPTS.items()],
+                            label="📋 Predefined Scenarios",
+                            value=list(PREDEFINED_PROMPTS.keys())[0]
+                        )
+                        # Prompt inputs
+                        heatmap_prompt1_input = gr.Textbox(
+                            label="Prompt 1",
+                            placeholder="Enter first prompt...",
+                            lines=2,
+                            value=PREDEFINED_PROMPTS[list(PREDEFINED_PROMPTS.keys())[0]]["prompt1"]
+                        )
+                        heatmap_prompt2_input = gr.Textbox(
+                            label="Prompt 2",
+                            placeholder="Enter second prompt...",
+                            lines=2,
+                            value=PREDEFINED_PROMPTS[list(PREDEFINED_PROMPTS.keys())[0]]["prompt2"]
+                        )
+                        # Component type configuration
+                        heatmap_component_dropdown = gr.Dropdown(
+                            choices=[
+                                ("Attention Output", "attention_output"),
+                                ("MLP Output", "mlp_output"),
+                                ("Gate Projection", "gate_proj"),
+                                ("Up Projection", "up_proj"),
+                                ("Down Projection", "down_proj"),
+                                ("Input Normalization", "input_norm")
+                            ],
+                            label="Component Type",
+                            value="attention_output",
+                            info="Type of neural network component to analyze"
+                        )
+                        # Layer number configuration
+                        heatmap_layer_number = gr.Number(
+                            label="Layer Number",
+                            value=7,
+                            minimum=0,
+                            step=1,
+                            info="Layer index - varies by model (e.g., 0-15 for small models)"
+                        )
+                        # Generate button
+                        heatmap_btn = gr.Button("🔥 Generate Heatmap Visualization", variant="primary", size="lg")
+                        # Status output
+                        heatmap_status = gr.Textbox(
+                            label="Status",
+                            value="Configure parameters and click 'Generate Heatmap Visualization'",
+                            interactive=False,
+                            lines=8,
+                            max_lines=10
+                        )
+                    # Right column: Results
+                    with gr.Column(scale=1):
+                        # Image display
+                        heatmap_image = gr.Image(
+                            label="Heatmap Visualization Result",
+                            type="filepath",
+                            show_label=True,
+                            show_download_button=True,
+                            interactive=False,
+                            height=400
+                        )
+                        # Download button (additional)
+                        download_heatmap = gr.File(
+                            label="📥 Download Visualization",
+                            visible=False
+                        )
+                # Update prompts when scenario changes for Heatmap
+                heatmap_scenario_dropdown.change(
+                    load_predefined_prompts,
+                    inputs=[heatmap_scenario_dropdown],
+                    outputs=[heatmap_prompt1_input, heatmap_prompt2_input]
+                )
+                # Connect the real Heatmap function
+                heatmap_btn.click(
+                    generate_heatmap_visualization,
+                    inputs=[
+                        model_dropdown,                # Reutilizamos el selector de modelo global
+                        custom_model_input,           # Reutilizamos el campo de modelo custom global
+                        heatmap_scenario_dropdown,
+                        heatmap_prompt1_input,
+                        heatmap_prompt2_input,
+                        heatmap_component_dropdown,
+                        heatmap_layer_number
+                    ],
+                    outputs=[heatmap_image, heatmap_status, download_heatmap],
+                    show_progress=True
+                )
+        # Footer
+        gr.Markdown("""
+        ---
+        **📚 How to use:**
+        1. Check that the backend is running
+        2. Select a predefined scenario or enter custom prompts
+        3. Configure layer settings
+        4. Generate visualizations to analyze potential biases
+        **🔗 Resources:** [OptiPFair Documentation](https://github.com/peremartra/optipfair) |
+        """)
+    return interface

requirements.txt ADDED Viewed

	@@ -0,0 +1,10 @@

+fastapi==0.115.12
+uvicorn==0.34.2
+gradio==5.29.1
+requests==2.32.3
+optipfair[viz]==0.1.3
+torch==2.7.0
+transformers==4.51.3
+matplotlib==3.10.3
+numpy==1.26.4
+Pillow==11.2.1

routers/__pycache__/visualize.cpython-312.pyc ADDED Viewed

Binary file (5.4 kB). View file

routers/visualize.py ADDED Viewed

	@@ -0,0 +1,124 @@

+# routers/visualize.py
+import os
+import logging
+from fastapi import APIRouter, HTTPException
+from fastapi.responses import FileResponse
+from schemas.visualize import (
+    VisualizePCARequest,
+    VisualizeMeanDiffRequest,
+    VisualizeHeatmapRequest,
+)
+from utils.visualize_pca import (
+    run_visualize_pca,
+    run_visualize_mean_diff,
+    run_visualize_heatmap,
+)
+logger = logging.getLogger(__name__)
+logger.setLevel(logging.INFO)
+router = APIRouter(
+    prefix="/visualize",
+    tags=["visualization"],
+)
+@router.post(
+    "/pca",
+    summary="Generates and returns the PCA visualization of activations",
+    response_class=FileResponse,
+)
+async def visualize_pca_endpoint(req: VisualizePCARequest):
+    """
+    Receives the parameters, calls the wrapper for optipfair.bias.visualize_pca,
+    and returns the resulting PNG/SVG image.
+    """
+    # 1. Execute the image generation and get the file path
+    try:
+        filepath = run_visualize_pca(
+            model_name=req.model_name,
+            prompt_pair=tuple(req.prompt_pair),
+            layer_key=req.layer_key,
+            highlight_diff=req.highlight_diff,
+            output_dir=req.output_dir,
+            figure_format=req.figure_format,
+            pair_index=req.pair_index,
+        )
+    except Exception as e:
+        # Log the full trace for debugging
+        logger.exception("❌ Error in visualize_pca_endpoint")
+        # And return the message to the client
+        raise HTTPException(status_code=500, detail=str(e))
+    # 2. Verify that the file exists
+    if not filepath or not os.path.isfile(filepath):
+        raise HTTPException(status_code=500, detail="Image file not found after generation")
+    # 3. Return the file directly to the client
+    return FileResponse(
+        path=filepath,
+        media_type=f"image/{req.figure_format}",
+        filename=os.path.basename(filepath),
+        headers={"Content-Disposition": f'inline; filename="{os.path.basename(filepath)}"'},
+    )
+@router.post("/mean-diff", response_class=FileResponse)
+async def visualize_mean_diff_endpoint(req: VisualizeMeanDiffRequest):
+    """
+    Receives the parameters, calls the wrapper for optipfair.bias.visualize_mean_differences,
+    and returns the resulting PNG/SVG image.
+    """
+    try:
+        filepath = run_visualize_mean_diff(
+            model_name=req.model_name,
+            prompt_pair=tuple(req.prompt_pair),
+            layer_type=req.layer_type,  # Changed from layer_key to layer_type
+            figure_format=req.figure_format,
+            output_dir=req.output_dir,
+            pair_index=req.pair_index,
+        )
+    except Exception as e:
+        # Log the full trace for debugging
+        logger.exception("Error in mean-diff endpoint")
+        raise HTTPException(status_code=500, detail=str(e))
+    # Verify that the file exists
+    if not os.path.isfile(filepath):
+        raise HTTPException(status_code=500, detail="Image file not found")
+    # Return the file directly to the client
+    return FileResponse(
+        path=filepath,
+        media_type=f"image/{req.figure_format}",
+        filename=os.path.basename(filepath),
+        headers={"Content-Disposition": f'inline; filename="{os.path.basename(filepath)}"'}
+    )
+@router.post("/heatmap", response_class=FileResponse)
+async def visualize_heatmap_endpoint(req: VisualizeHeatmapRequest):
+    """
+    Receives the parameters, calls the wrapper for optipfair.bias.visualize_heatmap,
+    and returns the resulting PNG/SVG image.
+    """
+    try:
+        filepath = run_visualize_heatmap(
+            model_name=req.model_name,
+            prompt_pair=tuple(req.prompt_pair),
+            layer_key=req.layer_key,
+            figure_format=req.figure_format,
+            output_dir=req.output_dir,
+        )
+    except Exception as e:
+        # Log the full trace for debugging
+        logger.exception("Error in heatmap endpoint")
+        raise HTTPException(status_code=500, detail=str(e))
+    # Verify that the file exists
+    if not os.path.isfile(filepath):
+        raise HTTPException(status_code=500, detail="Image file not found")
+    # Return the file directly to the client
+    return FileResponse(
+        path=filepath,
+        media_type=f"image/{req.figure_format}",
+        filename=os.path.basename(filepath),
+        headers={"Content-Disposition": f'inline; filename="{os.path.basename(filepath)}"'}
+    )

schemas/__pycache__/visualize.cpython-312.pyc ADDED Viewed

Binary file (2.54 kB). View file

schemas/visualize.py ADDED Viewed

	@@ -0,0 +1,51 @@

+# schemas/visualize.py
+from pydantic import BaseModel, field_validator
+from typing import List, Optional, Union, Tuple
+class VisualizePCARequest(BaseModel):
+    """
+    Schema for the /visualize-pca endpoint.
+    """
+    model_name: str
+    prompt_pair: List[str]
+    layer_key: str
+    highlight_diff: bool = True
+    figure_format: str = "png"
+    pair_index: int = 0
+    output_dir: Optional[str] = None
+    @field_validator("prompt_pair")
+    def must_be_two_prompts(cls, v):
+        if len(v) != 2:
+            raise ValueError("prompt_pair must be a list of exactly two strings")
+        return v
+class VisualizeMeanDiffRequest(BaseModel):
+    model_name: str
+    prompt_pair: List[str]
+    layer_type: str  # Changed from layer_key to layer_type
+    figure_format: str = "png"
+    output_dir: Optional[str] = None
+    pair_index: int = 0
+    @field_validator("prompt_pair")
+    def must_be_two_prompts(cls, v):
+        if len(v) != 2:
+            raise ValueError("prompt_pair must be a list of exactly two strings")
+        return v
+class VisualizeHeatmapRequest(BaseModel):
+    """
+    Schema for the /visualize/heatmap endpoint.
+    """
+    model_name: str
+    prompt_pair: List[str]
+    layer_key: str
+    figure_format: str = "png"
+    output_dir: Optional[str] = None
+    @field_validator("prompt_pair")
+    def must_be_two_prompts(cls, v):
+        if len(v) != 2:
+            raise ValueError("prompt_pair must be a list of exactly two strings")
+        return v

utils/__pycache__/visualize_pca.cpython-312.pyc ADDED Viewed

Binary file (6.65 kB). View file

utils/visualize_pca.py ADDED Viewed

	@@ -0,0 +1,182 @@

+# utils/visualize_pca.py
+import os
+import tempfile
+import logging
+from functools import lru_cache
+from typing import Tuple, Optional, Union, List
+import torch
+from optipfair.bias import visualize_pca, visualize_mean_differences, visualize_heatmap
+from transformers import AutoModelForCausalLM, AutoTokenizer
+import matplotlib
+matplotlib.use('Agg')  # Use 'Agg' backend for non-GUI environments
+logger = logging.getLogger(__name__)
+logger.setLevel(logging.INFO)
+@lru_cache(maxsize=None)
+def load_model_tokenizer(model_name: str):
+    """
+    Loads the model and tokenizer on the CPU once and caches the result.
+    """
+    logger.info(f"Loading model and tokenizer for '{model_name}'")
+    # Device selection: MPS (Apple Silicon) > CUDA > CPU
+    if torch.cuda.is_available():
+        device = torch.device("cuda")
+    elif torch.mps.is_available():
+        device = torch.device("mps")
+    else:
+        device = torch.device("cpu")
+    logger.info(f"Using device: {device}")
+    model = AutoModelForCausalLM.from_pretrained(model_name)
+    tokenizer = AutoTokenizer.from_pretrained(model_name)
+    model = model.to(device)
+    logger.info(f"Model loaded on device: {next(model.parameters()).device}")
+    return model, tokenizer
+def run_visualize_pca(
+    model_name: str,
+    prompt_pair: Tuple[str, str],
+    layer_key: str,
+    highlight_diff: bool = True,
+    output_dir: Optional[str] = None,
+    figure_format: str = "png",
+    pair_index: int = 0,
+) -> str:
+    if output_dir is None:
+        output_dir = tempfile.mkdtemp(prefix="optipfair_pca_")
+    os.makedirs(output_dir, exist_ok=True)
+    model, tokenizer = load_model_tokenizer(model_name)
+    visualize_pca(
+        model=model,
+        tokenizer=tokenizer,
+        prompt_pair=prompt_pair,
+        layer_key=layer_key,
+        highlight_diff=highlight_diff,
+        output_dir=output_dir,
+        figure_format=figure_format,
+        pair_index=pair_index
+    )
+    layer_parts = layer_key.split("_")
+    layer_type = "_".join(layer_parts[:-1])
+    layer_num = layer_parts[-1]
+    filename = build_visualization_filename(
+        vis_type="pca",
+        layer_type=layer_type,
+        layer_num=layer_num,
+        pair_index=pair_index,
+        figure_format=figure_format
+    )
+    filepath = os.path.join(output_dir, filename)
+    if not os.path.isfile(filepath):
+        raise FileNotFoundError(f"Expected image file not found: {filepath}")
+    logger.info(f"PCA image saved at {filepath}")
+    return filepath
+def run_visualize_mean_diff(
+    model_name: str,
+    prompt_pair: Tuple[str, str],
+    layer_type: str,  # Changed from layer_key to layer_type
+    figure_format: str = "png",
+    output_dir: Optional[str] = None,
+    pair_index: int = 0,
+) -> str:
+    if output_dir is None:
+        output_dir = tempfile.mkdtemp(prefix="optipfair_mean_diff_")
+    os.makedirs(output_dir, exist_ok=True)
+    model, tokenizer = load_model_tokenizer(model_name)
+    visualize_mean_differences(
+        model=model,
+        tokenizer=tokenizer,
+        prompt_pair=prompt_pair,
+        layer_type=layer_type,
+        layers="all",  # By default, show all layers
+        output_dir=output_dir,
+        figure_format=figure_format,
+        pair_index=pair_index
+    )
+    filename = build_visualization_filename(
+        vis_type="mean_diff",
+        layer_type=layer_type,
+        pair_index=pair_index,
+        figure_format=figure_format
+    )
+    filepath = os.path.join(output_dir, filename)
+    if not os.path.isfile(filepath):
+        raise FileNotFoundError(f"Expected image file not found: {filepath}")
+    logger.info(f"Mean-diff image saved at {filepath}")
+    return filepath
+def run_visualize_heatmap(
+    model_name: str,
+    prompt_pair: Tuple[str, str],
+    layer_key: str,
+    figure_format: str = "png",
+    output_dir: Optional[str] = None,
+    pair_index: int = 0,
+) -> str:
+    if output_dir is None:
+        output_dir = tempfile.mkdtemp(prefix="optipfair_heatmap_")
+    os.makedirs(output_dir, exist_ok=True)
+    model, tokenizer = load_model_tokenizer(model_name)
+    visualize_heatmap(
+        model=model,
+        tokenizer=tokenizer,
+        prompt_pair=prompt_pair,
+        layer_key=layer_key,
+        output_dir=output_dir,
+        figure_format=figure_format,
+        pair_index=pair_index
+    )
+    parts = layer_key.split("_")
+    layer_type = "_".join(parts[:-1])
+    layer_num = parts[-1]
+    filename = build_visualization_filename(
+        vis_type="heatmap",
+        layer_type=layer_type,
+        layer_num=layer_num,
+        pair_index=pair_index,
+        figure_format=figure_format
+    )
+    filepath = os.path.join(output_dir, filename)
+    if not os.path.isfile(filepath):
+        raise FileNotFoundError(f"Expected image file not found: {filepath}")
+    logger.info(f"Heatmap image saved at {filepath}")
+    return filepath
+def build_visualization_filename(
+    vis_type: str,
+    layer_type: str,
+    layer_num: str = None,
+    layers: Union[str, List[int]] = None,
+    pair_index: int = 0,
+    figure_format: str = "png"
+) -> str:
+    """
+    Builds the filename for any visualization.
+    """
+    if vis_type == "mean_diff":
+        # The visualize_mean_differences function does not include the layer number in the filename
+        return f"mean_diff_{layer_type}_pair{pair_index}.{figure_format}"
+    elif vis_type in ("pca", "heatmap"):
+        return f"{vis_type}_{layer_type}_{layer_num}_pair{pair_index}.{figure_format}"
+    else:
+        raise ValueError(f"Unknown visualization type: {vis_type}")