Spaces:

walaa2022
/

lumenex

Sleeping

App Files Files Community

walaa2022 committed on May 29

Commit

644aa62

verified ·

1 Parent(s): 815f7ad

Update app.py

Browse files

Files changed (1) hide show

app.py +268 -433

app.py CHANGED Viewed

@@ -1,461 +1,296 @@
-# app.py - Fixed MedGemma Implementation Based on Google's Official Approach
 import gradio as gr
 import torch
-import os
-import logging
-import json
-import requests
 from PIL import Image
-import base64
-import io
-from huggingface_hub import login
-from collections import defaultdict, Counter
-import time
-# Configure logging
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-# Usage tracking
-class UsageTracker:
     def __init__(self):
-        self.stats = {
-            'total_analyses': 0,
-            'successful_analyses': 0,
-            'failed_analyses': 0,
-            'average_processing_time': 0.0,
-            'question_types': Counter()
         }
-    def log_analysis(self, success, duration, question_type=None):
-        self.stats['total_analyses'] += 1
-        if success:
-            self.stats['successful_analyses'] += 1
-        else:
-            self.stats['failed_analyses'] += 1
-        total_time = self.stats['average_processing_time'] * (self.stats['total_analyses'] - 1)
-        self.stats['average_processing_time'] = (total_time + duration) / self.stats['total_analyses']
-        if question_type:
-            self.stats['question_types'][question_type] += 1
-# Rate limiting
-class RateLimiter:
-    def __init__(self, max_requests_per_hour=50):
-        self.max_requests_per_hour = max_requests_per_hour
-        self.requests = defaultdict(list)
-    def is_allowed(self, user_id="default"):
-        current_time = time.time()
-        hour_ago = current_time - 3600
-        self.requests[user_id] = [req_time for req_time in self.requests[user_id] if req_time > hour_ago]
-        if len(self.requests[user_id]) < self.max_requests_per_hour:
-            self.requests[user_id].append(current_time)
-            return True
-        return False
-# Initialize components
-usage_tracker = UsageTracker()
-rate_limiter = RateLimiter()
-# MedGemma API Configuration
-MODEL_ID = "google/medgemma-4b-it"
-def authenticate_hf():
-    """Authenticate with Hugging Face"""
-    try:
-        hf_token = os.getenv('HF_TOKEN')
-        if hf_token:
-            login(token=hf_token)
-            logger.info("✅ Authenticated with Hugging Face")
-            return True, hf_token
-        else:
-            logger.warning("⚠️ No HF_TOKEN found")
-            return False, None
-    except Exception as e:
-        logger.error(f"❌ Authentication failed: {e}")
-        return False, None
-def image_to_base64(image):
-    """Convert PIL image to base64 string"""
-    try:
-        buffer = io.BytesIO()
-        image.save(buffer, format='PNG')
-        img_str = base64.b64encode(buffer.getvalue()).decode()
-        return f"data:image/png;base64,{img_str}"
-    except Exception as e:
-        logger.error(f"Error converting image: {e}")
-        return None
-def call_medgemma_api(image, prompt, patient_history="", hf_token=None):
-    """Call MedGemma using Hugging Face Inference API"""
-    try:
-        # Use HF Inference API endpoint
-        api_url = f"https://api-inference.huggingface.co/models/{MODEL_ID}"
-        headers = {
-            "Authorization": f"Bearer {hf_token}",
-            "Content-Type": "application/json"
-        }
-        # Prepare the payload following Google's format
-        system_instruction = "You are an expert medical AI assistant specialized in medical image analysis. Provide detailed analysis for educational purposes only."
-        # Build the full prompt
-        full_prompt = system_instruction + " "
-        if patient_history.strip():
-            full_prompt += f"Patient History: {patient_history} "
-        full_prompt += prompt
-        # Convert image to base64
-        image_b64 = image_to_base64(image)
-        if not image_b64:
-            return None, "Failed to process image"
-        # Prepare the request payload
-        payload = {
-            "inputs": {
-                "prompt": full_prompt,
-                "multi_modal_data": {
-                    "image": image_b64
-                },
-                "max_tokens": 1000,
-                "temperature": 0.3,
-                "raw_response": True
-            }
-        }
-        # Make the API call
-        response = requests.post(api_url, headers=headers, json=payload, timeout=120)
-        if response.status_code == 200:
-            result = response.json()
-            if isinstance(result, list) and len(result) > 0:
-                return result[0].get('generated_text', ''), None
-            elif isinstance(result, dict):
-                return result.get('generated_text', result.get('text', str(result))), None
             else:
-                return str(result), None
-        else:
-            error_msg = f"API Error {response.status_code}: {response.text}"
-            logger.error(error_msg)
-            return None, error_msg
-    except requests.exceptions.Timeout:
-        return None, "Request timeout - model may be loading"
-    except Exception as e:
-        logger.error(f"API call failed: {e}")
-        return None, str(e)
-def analyze_medical_image_medgemma(image, clinical_question, patient_history=""):
-    """Main analysis function using MedGemma"""
-    start_time = time.time()
-    # Rate limiting
-    if not rate_limiter.is_allowed():
-        usage_tracker.log_analysis(False, time.time() - start_time)
-        return "⚠️ Too many requests. Please wait before trying again."
-    # Validate inputs
-    if image is None:
-        return "⚠️ Please upload a medical image first."
-    if not clinical_question.strip():
-        return "⚠️ Please provide a clinical question."
-    # Authenticate
-    auth_success, hf_token = authenticate_hf()
-    if not auth_success or not hf_token:
-        usage_tracker.log_analysis(False, time.time() - start_time)
-        return """❌ **Authentication Required**
-To use MedGemma, you need:
-1. Access to the model at https://huggingface.co/google/medgemma-4b-it
-2. HF_TOKEN set in Space Settings → Repository secrets
-**Current Status**: Authentication failed - cannot access MedGemma."""
-    try:
-        logger.info("Calling MedGemma API...")
-        # Call MedGemma API
-        response_text, error = call_medgemma_api(
-            image=image,
-            prompt=clinical_question,
-            patient_history=patient_history,
-            hf_token=hf_token
-        )
-        if error:
-            usage_tracker.log_analysis(False, time.time() - start_time)
-            return f"""❌ **MedGemma API Error**
-{error}
-**Possible solutions:**
-1. The model may be loading - try again in a few minutes
-2. Check if you have proper access to MedGemma
-3. Verify your HF_TOKEN is valid
-**Note**: MedGemma is a gated model and may have usage limits."""
-        if not response_text:
-            usage_tracker.log_analysis(False, time.time() - start_time)
-            return "❌ No response from MedGemma. Please try again."
-        # Clean up response
-        response_text = response_text.strip()
-        # Add medical disclaimer
-        disclaimer = """
----
-### ⚠️ MEDICAL DISCLAIMER
-**This analysis is for educational and research purposes only.**
-- This AI assistant is not a substitute for professional medical advice
-- Always consult qualified healthcare professionals for diagnosis and treatment
-- Do not make medical decisions based solely on this analysis
-- In case of medical emergency, contact emergency services immediately
----
-**Powered by**: Google MedGemma-4B via Hugging Face Inference API
-        """
-        # Log successful analysis
-        duration = time.time() - start_time
-        question_type = classify_question(clinical_question)
-        usage_tracker.log_analysis(True, duration, question_type)
-        logger.info("✅ MedGemma analysis completed successfully")
-        return response_text + disclaimer
-    except Exception as e:
-        duration = time.time() - start_time
-        usage_tracker.log_analysis(False, duration)
-        logger.error(f"❌ Analysis error: {str(e)}")
-        return f"❌ Analysis failed: {str(e)}\n\nPlease try again or use a different image."
-def classify_question(question):
-    """Classify clinical question type"""
-    question_lower = question.lower()
-    if any(word in question_lower for word in ['describe', 'findings', 'observe']):
-        return 'descriptive'
-    elif any(word in question_lower for word in ['diagnosis', 'differential', 'condition']):
-        return 'diagnostic'
-    elif any(word in question_lower for word in ['abnormal', 'pathology', 'disease']):
-        return 'pathological'
-    else:
-        return 'general'
-def get_usage_stats():
-    """Get usage statistics"""
-    stats = usage_tracker.stats
-    if stats['total_analyses'] == 0:
-        return "📊 **Usage Statistics**\n\nNo analyses performed yet."
-    success_rate = (stats['successful_analyses'] / stats['total_analyses']) * 100
-    return f"""📊 **Usage Statistics**
-**Performance:**
-- Total Analyses: {stats['total_analyses']}
-- Success Rate: {success_rate:.1f}%
-- Avg Processing Time: {stats['average_processing_time']:.2f}s
-**Popular Question Types:**
-{chr(10).join([f"- {qtype}: {count}" for qtype, count in stats['question_types'].most_common(3)])}
-"""
-# Create Gradio interface
-def create_interface():
-    # Check authentication status
-    auth_success, _ = authenticate_hf()
-    with gr.Blocks(
-        title="MedGemma Medical Analysis",
-        theme=gr.themes.Soft(),
-        css="""
-        .gradio-container { max-width: 1200px !important; }
-        .disclaimer { background-color: #fef2f2; border: 1px solid #fecaca; border-radius: 8px; padding: 16px; margin: 16px 0; }
-        .success { background-color: #f0f9ff; border: 1px solid #bae6fd; border-radius: 8px; padding: 16px; margin: 16px 0; }
-        .warning { background-color: #fffbeb; border: 1px solid #fed7aa; border-radius: 8px; padding: 16px; margin: 16px 0; }
-        """
-    ) as demo:
-        # Header
-        gr.Markdown("""
-        # 🏥 MedGemma Medical Image Analysis
-        **Google's Medical AI Assistant - MedGemma-4B**
-        Specialized medical AI trained specifically for:
-        🫁 **Radiology** • 🔬 **Histopathology** • 👁️ **Ophthalmology** • 🩺 **Dermatology**
-        """)
-        # Status display
-        if auth_success:
-            gr.Markdown("""
-            <div class="success">
-            ✅ <strong>MEDGEMMA READY</strong><br>
-            Authenticated with Google's MedGemma-4B model. Ready for professional medical image analysis.
-            </div>
-            """)
-        else:
-            gr.Markdown("""
-            <div class="warning">
-            🔐 <strong>AUTHENTICATION REQUIRED</strong><br>
-            Please ensure HF_TOKEN is set in Space Settings → Repository secrets and you have access to MedGemma.
-            </div>
-            """)
-        # Medical disclaimer
-        gr.Markdown("""
-        <div class="disclaimer">
-        ⚠️ <strong>IMPORTANT MEDICAL DISCLAIMER</strong><br>
-        This tool is for <strong>educational and research purposes only</strong>.
-        Do not upload real patient data. Always consult qualified healthcare professionals.
-        </div>
-        """)
-        with gr.Row():
-            # Left column
-            with gr.Column(scale=2):
-                with gr.Row():
-                    with gr.Column():
-                        gr.Markdown("## 📤 Medical Image")
-                        image_input = gr.Image(
-                            label="Upload Medical Image",
-                            type="pil",
-                            height=300
-                        )
-                    with gr.Column():
-                        gr.Markdown("## 💬 Clinical Query")
-                        clinical_question = gr.Textbox(
-                            label="Clinical Question *",
-                            placeholder="Examples:\n• Describe this X-ray systematically\n• What pathological changes are visible?\n• Provide differential diagnosis\n• Assess image quality and findings",
-                            lines=4
-                        )
-                        patient_history = gr.Textbox(
-                            label="Patient History (Optional)",
-                            placeholder="e.g., 65-year-old male with chronic cough, smoking history",
-                            lines=2
                         )
-                with gr.Row():
-                    clear_btn = gr.Button("🗑️ Clear", variant="secondary")
-                    analyze_btn = gr.Button("🔍 Analyze with MedGemma", variant="primary", size="lg")
-                gr.Markdown("## 📋 MedGemma Analysis")
-                output = gr.Textbox(
-                    label="Medical AI Analysis Results",
-                    lines=20,
-                    show_copy_button=True,
-                    placeholder="Upload a medical image and ask a clinical question to get started..."
-                )
-            # Right column - System info
-            with gr.Column(scale=1):
-                gr.Markdown("## ℹ️ System Status")
-                auth_status = "✅ Authenticated" if auth_success else "🔐 Auth Required"
-                gr.Markdown(f"""
-                **Authentication:** {auth_status}
-                **Model:** Google MedGemma-4B
-                **API:** Hugging Face Inference
-                **Status:** {'Ready' if auth_success else 'Setup Required'}
-                """)
-                gr.Markdown("## 📊 Usage Statistics")
-                stats_display = gr.Markdown("")
-                refresh_stats_btn = gr.Button("🔄 Refresh Stats", size="sm")
-                gr.Markdown("## 🎯 Quick Examples")
-                chest_btn = gr.Button("Chest X-ray", size="sm")
-                pathology_btn = gr.Button("Pathology", size="sm")
-                diagnosis_btn = gr.Button("Diagnosis", size="sm")
-        # Example cases
-        with gr.Accordion("📚 Medical Cases", open=False):
-            examples = gr.Examples(
-                examples=[
-                    [
-                        "https://upload.wikimedia.org/wikipedia/commons/c/c8/Chest_Xray_PA_3-8-2010.png",
-                        "You are an expert radiologist. Describe this X-ray systematically including heart size, lung fields, and any abnormalities.",
-                        "Adult patient with respiratory symptoms"
-                    ]
-                ],
-                inputs=[image_input, clinical_question, patient_history]
-            )
-        # Event handlers
-        analyze_btn.click(
-            fn=analyze_medical_image_medgemma,
-            inputs=[image_input, clinical_question, patient_history],
-            outputs=output,
-            show_progress=True
-        )
-        clear_btn.click(
-            fn=lambda: (None, "", "", ""),
-            outputs=[image_input, clinical_question, patient_history, output]
-        )
-        refresh_stats_btn.click(
-            fn=get_usage_stats,
-            outputs=stats_display
-        )
-        # Quick example handlers
-        chest_btn.click(
-            fn=lambda: ("Analyze this chest X-ray systematically. Comment on cardiac silhouette, lung fields, mediastinum, and any pathological findings.", "Adult with respiratory symptoms"),
-            outputs=[clinical_question, patient_history]
-        )
-        pathology_btn.click(
-            fn=lambda: ("What pathological changes are visible in this medical image? Provide structured analysis with clinical significance.", ""),
-            outputs=[clinical_question, patient_history]
-        )
-        diagnosis_btn.click(
-            fn=lambda: ("Based on the imaging findings, what are the most likely differential diagnoses? Consider clinical context.", "Patient with acute presentation"),
-            outputs=[clinical_question, patient_history]
-        )
-        # Footer
-        gr.Markdown("""
-        ---
-        ### 🔬 About MedGemma
-        **MedGemma-4B** is Google's specialized medical AI model designed specifically for medical image analysis and clinical reasoning.
-        It represents state-of-the-art performance in medical AI applications.
-        **Key Features:**
-        - **Medical Specialization**: Trained specifically on medical imaging data
-        - **Multi-modal**: Handles both images and clinical text
-        - **Professional Grade**: Designed for medical education and research
-        - **Google Quality**: Built by Google's medical AI team
-        ### 🔒 Privacy & Compliance
-        - **Real-time processing** with no data retention
-        - **Educational purpose** design and disclaimers
-        - **HIPAA-aware** interface (no PHI uploads)
-        - **Professional standards** for medical AI applications
-        **Model:** Google MedGemma-4B | **API:** Hugging Face Inference | **License:** Apache 2.0
-        """)
-    return demo
-# Launch the app
 if __name__ == "__main__":
-    demo = create_interface()
-    demo.launch(
-        server_name="0.0.0.0",
-        server_port=7860,
-        show_error=True
-    )

 import gradio as gr
 import torch
+from transformers import (
+    AutoModelForCausalLM,
+    AutoModelForImageTextToText,
+    AutoTokenizer,
+    AutoProcessor,
+    BitsAndBytesConfig,
+    pipeline
+)
 from PIL import Image
+import os
+import spaces
+# Configuration
+MODEL_4B = "google/medgemma-4b-it"
+MODEL_27B = "google/medgemma-27b-text-it"
+class MedGemmaApp:
+    """Keep one MedGemma model loaded at a time and answer chat requests.
+
+    ``model_type`` is "multimodal" after the 4B model is loaded, "text"
+    after the 27B model is loaded, and None while nothing is loaded.
+    """
     def __init__(self):
+        # Every attribute always exists; None means "not loaded".
+        self.current_model = None
+        self.current_tokenizer = None
+        self.current_processor = None
+        self.current_pipe = None
+        self.model_type = None
+    def get_model_kwargs(self, use_quantization=True):
+        """Return the keyword arguments passed to ``from_pretrained``.
+
+        Always requests bfloat16 weights with ``device_map="auto"``; adds a
+        4-bit BitsAndBytes config when ``use_quantization`` is true.
+        """
+        model_kwargs = {
+            "torch_dtype": torch.bfloat16,
+            "device_map": "auto",
         }
+        if use_quantization:
+            model_kwargs["quantization_config"] = BitsAndBytesConfig(load_in_4bit=True)
+        return model_kwargs
+    # NOTE(review): if this Space runs on ZeroGPU, confirm that state assigned
+    # to `self` inside a @spaces.GPU call is still visible to later calls.
+    @spaces.GPU
+    def load_model(self, model_choice, use_quantization=True):
+        """Load the selected model, replacing any previously loaded one.
+
+        Args:
+            model_choice: "4B (Multimodal)" selects MODEL_4B; any other
+                value selects MODEL_27B.
+            use_quantization: Load the weights with 4-bit quantization.
+
+        Returns:
+            A status string for the UI. Failures are reported in the
+            string rather than raised.
+        """
+        try:
+            is_multimodal = model_choice == "4B (Multimodal)"
+            model_id = MODEL_4B if is_multimodal else MODEL_27B
+            model_kwargs = self.get_model_kwargs(use_quantization)
+            # Clear previous model
+            if self.current_model is not None:
+                # Rebind to None instead of `del`: deleting the attributes
+                # made the next load (e.g. 4B -> 27B -> 4B) and every later
+                # chat call fail with AttributeError.
+                self.current_pipe = None
+                self.current_processor = None
+                self.current_tokenizer = None
+                self.current_model = None
+                self.model_type = None
+                torch.cuda.empty_cache()
+            if is_multimodal:
+                # Load multimodal model
+                self.current_model = AutoModelForImageTextToText.from_pretrained(
+                    model_id, **model_kwargs
+                )
+                self.current_processor = AutoProcessor.from_pretrained(model_id)
+                # Create pipeline for easier inference
+                self.current_pipe = pipeline(
+                    "image-text-to-text",
+                    model=self.current_model,
+                    processor=self.current_processor,
+                )
+                self.current_pipe.model.generation_config.do_sample = False
+                # Set last so a half-finished load never looks usable.
+                self.model_type = "multimodal"
             else:
+                # Load text-only model
+                self.current_model = AutoModelForCausalLM.from_pretrained(
+                    model_id, **model_kwargs
+                )
+                self.current_tokenizer = AutoTokenizer.from_pretrained(model_id)
+                # Create pipeline for easier inference
+                self.current_pipe = pipeline(
+                    "text-generation",
+                    model=self.current_model,
+                    tokenizer=self.current_tokenizer,
+                )
+                self.current_pipe.model.generation_config.do_sample = False
+                # Set last so a half-finished load never looks usable.
+                self.model_type = "text"
+            return f"✅ Successfully loaded {model_choice} model!"
+        except Exception as e:
+            return f"❌ Error loading model: {str(e)}"
+    @spaces.GPU
+    def chat_text_only(self, message, history, system_instruction="You are a helpful medical assistant."):
+        """Answer a text question with the text-only model.
+
+        Args:
+            message: The new user question.
+            history: Earlier turns as (user, assistant) pairs; None or an
+                empty list means no earlier turns.
+            system_instruction: Text of the system message.
+
+        Returns:
+            The content of the last message in the pipeline output, or an
+            explanatory string if the text model is not loaded or
+            generation fails.
+        """
+        if self.current_model is None or self.model_type != "text":
+            return "Please load the 27B (Text Only) model first!"
+        try:
+            # Order: system, earlier turns oldest first, then the new question.
+            messages = [{"role": "system", "content": system_instruction}]
+            for human, assistant in history or []:
+                messages.append({"role": "user", "content": human})
+                messages.append({"role": "assistant", "content": assistant})
+            messages.append({"role": "user", "content": message})
+            output = self.current_pipe(messages, max_new_tokens=500)
+            response = output[0]["generated_text"][-1]["content"]
+            return response
+        except Exception as e:
+            return f"Error generating response: {str(e)}"
+    @spaces.GPU
+    def chat_with_image(self, message, image, system_instruction="You are an expert radiologist."):
+        """Answer a question about an image with the multimodal model.
+
+        Args:
+            message: The user's question about the image.
+            image: The image to analyze; None is rejected with a message.
+            system_instruction: Text of the system message.
+
+        Returns:
+            The content of the last message in the pipeline output, or an
+            explanatory string if the multimodal model is not loaded, no
+            image was given, or generation fails.
+        """
+        if self.current_model is None or self.model_type != "multimodal":
+            return "Please load the 4B (Multimodal) model first!"
+        if image is None:
+            return "Please upload an image to analyze."
+        try:
+            messages = [
+                {
+                    "role": "system",
+                    "content": [{"type": "text", "text": system_instruction}]
+                },
+                {
+                    "role": "user",
+                    "content": [
+                        {"type": "text", "text": message},
+                        {"type": "image", "image": image}
+                    ]
+                }
+            ]
+            output = self.current_pipe(text=messages, max_new_tokens=300)
+            response = output[0]["generated_text"][-1]["content"]
+            return response
+        except Exception as e:
+            return f"Error analyzing image: {str(e)}"
+# Single module-level MedGemmaApp instance; every event handler below calls
+# into it, so the loaded model is state shared across handler calls.
+app = MedGemmaApp()
+# Create Gradio interface
+with gr.Blocks(title="MedGemma Medical AI Assistant", theme=gr.themes.Soft()) as demo:
+    gr.Markdown("""
+    # 🏥 MedGemma Medical AI Assistant
+    Welcome to MedGemma, Google's medical AI assistant! Choose between:
+    - **4B Multimodal**: Analyze medical images (X-rays, scans) with text
+    - **27B Text-Only**: Advanced medical text conversations
+    > **Note**: This is for educational and research purposes only. Always consult healthcare professionals for medical advice.
+    """)
+    # Model selection controls
+    with gr.Row():
+        with gr.Column(scale=1):
+            # The choice strings are compared literally in
+            # MedGemmaApp.load_model ("4B (Multimodal)" picks the 4B model,
+            # anything else picks the 27B model), so keep them in sync.
+            model_choice = gr.Radio(
+                choices=["4B (Multimodal)", "27B (Text Only)"],
+                value="4B (Multimodal)",
+                label="Select Model",
+                info="4B supports images, 27B is text-only but more powerful"
+            )
+            # Passed to load_model as its use_quantization argument.
+            use_quantization = gr.Checkbox(
+                value=True,
+                label="Use 4-bit Quantization",
+                info="Reduces memory usage (recommended)"
+            )
+            load_btn = gr.Button("🚀 Load Model", variant="primary")
+            # Read-only box showing the status string returned by load_model.
+            model_status = gr.Textbox(label="Model Status", interactive=False)
+    with gr.Tabs():
+        # Text-only chat tab
+        with gr.Tab("💬 Text Chat", id="text_chat"):
+            gr.Markdown("### Medical Text Consultation")
+            with gr.Row():
+                with gr.Column(scale=3):
+                    # System message forwarded with every text question.
+                    text_system = gr.Textbox(
+                        value="You are a helpful medical assistant.",
+                        label="System Instruction",
+                        placeholder="Set the AI's role and behavior..."
+                    )
+                    chatbot_text = gr.Chatbot(
+                        height=400,
+                        placeholder="Start a medical conversation...",
+                        label="Medical Assistant"
+                    )
+                    with gr.Row():
+                        text_input = gr.Textbox(
+                            placeholder="Ask a medical question...",
+                            label="Your Question",
+                            scale=4
                         )
+                        text_submit = gr.Button("Send", scale=1)
+                with gr.Column(scale=1):
+                    gr.Markdown("""
+                    ### 💡 Example Questions:
+                    - How do you differentiate bacterial from viral pneumonia?
+                    - What are the symptoms of diabetes?
+                    - Explain the mechanism of action of ACE inhibitors
+                    - What are the contraindications for MRI?
+                    """)
+        # Image analysis tab
+        with gr.Tab("🖼️ Image Analysis", id="image_analysis"):
+            gr.Markdown("### Medical Image Analysis")
+            with gr.Row():
+                with gr.Column(scale=2):
+                    # type="pil" asks Gradio for a PIL image.
+                    image_input = gr.Image(
+                        type="pil",
+                        label="Upload Medical Image",
+                        height=300
+                    )
+                    # System message forwarded with every image question.
+                    image_system = gr.Textbox(
+                        value="You are an expert radiologist.",
+                        label="System Instruction"
+                    )
+                    image_text_input = gr.Textbox(
+                        value="Describe this X-ray",
+                        label="Question about the image",
+                        placeholder="What would you like to know about this image?"
+                    )
+                    image_submit = gr.Button("🔍 Analyze Image", variant="primary")
+                with gr.Column(scale=2):
+                    image_output = gr.Textbox(
+                        label="Analysis Result",
+                        lines=15,
+                        placeholder="Upload an image and click 'Analyze Image' to see the AI's analysis..."
+                    )
+    # Event handlers
+    # Load button: (model choice, quantization flag) -> status text.
+    load_btn.click(
+        fn=app.load_model,
+        inputs=[model_choice, use_quantization],
+        outputs=[model_status]
+    )
+    def respond_text(message, history, system_instruction):
+        """Run one text-chat turn for the UI.
+
+        Args:
+            message: Text from the question box; None or blank is ignored.
+            history: Chatbot history as (user, assistant) pairs, or None.
+            system_instruction: System message forwarded to the model.
+
+        Returns:
+            (updated history, "") -- the empty string clears the input box.
+        """
+        # Work on a copy so the caller's list is not mutated, and treat a
+        # missing history as empty.
+        history = list(history or [])
+        if not (message or "").strip():
+            return history, ""
+        response = app.chat_text_only(message, history, system_instruction)
+        history.append((message, response))
+        return history, ""
+    # The Send button and pressing Enter in the question box run the same
+    # handler; it returns the updated chat history plus an empty string that
+    # clears the question box.
+    text_submit.click(
+        fn=respond_text,
+        inputs=[text_input, chatbot_text, text_system],
+        outputs=[chatbot_text, text_input]
+    )
+    text_input.submit(
+        fn=respond_text,
+        inputs=[text_input, chatbot_text, text_system],
+        outputs=[chatbot_text, text_input]
+    )
+    # Input order matches chat_with_image(message, image, system_instruction).
+    image_submit.click(
+        fn=app.chat_with_image,
+        inputs=[image_text_input, image_input, image_system],
+        outputs=[image_output]
+    )
+    # Footer: about section and disclaimer
+    gr.Markdown("""
+    ---
+    ### 📚 About MedGemma
+    MedGemma is a collection of Gemma variants trained for medical applications.
+    Learn more at the [HAI-DEF developer site](https://developers.google.com/health-ai-developer-foundations/medgemma).
+    **Disclaimer**: This tool is for educational and research purposes only.
+    Always consult qualified healthcare professionals for medical advice.
+    """)
+# Start the Gradio server only when this file is run as a script.
 if __name__ == "__main__":
+    demo.launch()