Spaces · Runtime error

Arjun Moorthy committed · da47961
Parent(s): cefbc35

Clean up repository and fix file locations

Files changed:
- Oncolife/requirements.txt +0 -20
- README.md +1 -1
- app.py +0 -259
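
Taken together with the README change below, the deletions imply the following post-commit layout (a sketch inferred from the diff; a root-level requirements.txt is an assumption based on the new requirements_file value):

    .
    ├── README.md            # app_file points at Oncolife/app.py
    ├── requirements.txt     # replaces the deleted Oncolife/requirements.txt
    └── Oncolife/
        └── app.py           # replaces the deleted root-level app.py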
Oncolife/requirements.txt DELETED
@@ -1,20 +0,0 @@
-# Medical Chatbot HF Space Requirements
-
-# Web framework
-gradio>=4.44.0
-
-# Machine learning libraries - specific versions for compatibility
-torch>=2.1.0,<3.0.0
-transformers>=4.35.0,<5.0.0
-accelerate>=0.24.0
-
-# HF Spaces GPU support
-spaces>=0.1.0
-
-# Basic utilities
-numpy>=1.21.0,<2.0.0
-requests>=2.28.0
-
-# Additional dependencies for better device handling
-safetensors>=0.4.0
-tokenizers>=0.15.0
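
To recreate the deleted environment locally, the same pins install as usual (assuming the file is kept at the repository root, as the README change below implies):

    pip install -r requirements.txt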
README.md CHANGED
@@ -6,7 +6,7 @@ colorTo: green
 sdk: gradio
 sdk_version: 4.44.0
 app_file: Oncolife/app.py
-requirements_file:
+requirements_file: requirements.txt
 pinned: false
 ---
 
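For reference, the metadata block after this change reads as follows (only the lines visible in the hunk; the fields above colorTo: green are elided by the diff and left out here too):

    colorTo: green
    sdk: gradio
    sdk_version: 4.44.0
    app_file: Oncolife/app.py
    requirements_file: requirements.txt
    pinned: false
    ---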
app.py DELETED
@@ -1,259 +0,0 @@
-#!/usr/bin/env python3
-"""
-OncoLife Symptom & Triage Assistant
-A medical chatbot that performs both symptom assessment and clinical triage for chemotherapy patients.
-Updated: Using BioMistral-7B base model for medical conversations.
-REBUILD: Simplified to use only base model, no adapters.
-"""
-
-import gradio as gr
-import os
-import json
-from transformers import AutoTokenizer, MistralForCausalLM
-import torch
-from spaces import GPU
-
-# Force GPU detection for HF Spaces
-@GPU
-def force_gpu_detection():
-    """Force GPU detection for Hugging Face Spaces"""
-    return torch.cuda.is_available()
-
-class OncoLifeAssistant:
-    def __init__(self):
-        # BioMistral base model configuration
-        BASE = "BioMistral/BioMistral-7B"
-
-        print("🔄 Initializing OncoLife Symptom & Triage Assistant")
-        print(f"📦 Loading base model: {BASE}")
-
-        # Force GPU detection first
-        try:
-            gpu_available = force_gpu_detection()
-            print(f"🖥️ GPU Detection: {gpu_available}")
-        except Exception as e:
-            print(f"⚠️ GPU detection error: {e}")
-            gpu_available = torch.cuda.is_available()
-
-        self._load_model(BASE, gpu_available)
-
-        # Initialize conversation state
-        self.conversation_state = {
-            "symptoms": [],
-            "asked_ids": [],
-            "answers": {},
-            "current_symptom": None,
-            "conversation_phase": "initial"  # initial, symptom_assessment, triage, summary
-        }
-
-    def _load_model(self, model_id, gpu_available):
-        """Load the BioMistral base model"""
-        try:
-            print("🔄 Loading BioMistral base model...")
-
-            # Determine device strategy
-            if gpu_available and torch.cuda.is_available():
-                device = "cuda"
-                dtype = torch.float16
-                print("🖥️ Loading BioMistral model on GPU...")
-            else:
-                device = "cpu"
-                dtype = torch.float32
-                print("💻 Loading BioMistral model on CPU...")
-
-            # Load tokenizer
-            print(f"📝 Loading tokenizer: {model_id}")
-            self.tokenizer = AutoTokenizer.from_pretrained(
-                model_id,
-                trust_remote_code=True
-            )
-
-            # Load the model
-            print(f"📦 Loading model: {model_id}")
-            self.model = MistralForCausalLM.from_pretrained(
-                model_id,
-                trust_remote_code=True,
-                device_map="auto",
-                torch_dtype=dtype,
-                low_cpu_mem_usage=True
-            )
-
-            # Add pad token if not present
-            if self.tokenizer.pad_token is None:
-                self.tokenizer.pad_token = self.tokenizer.eos_token
-
-            print(f"✅ BioMistral base model loaded successfully on {device.upper()}!")
-
-        except Exception as e:
-            print(f"❌ Error loading BioMistral model: {e}")
-            self.model = None
-            self.tokenizer = None
-
-    def generate_oncolife_response(self, user_input, conversation_history):
-        """Generate response using OncoLife Symptom & Triage Assistant protocol"""
-        try:
-            if self.model is None or self.tokenizer is None:
-                return """❌ **Model Loading Error**
-
-The OncoLife assistant model failed to load. This could be due to:
-1. Model not available
-2. Memory constraints
-3. Network issues
-
-Please check the Space logs for details."""
-
-            print(f"🔄 Generating OncoLife response for: {user_input}")
-
-            # Create OncoLife-specific prompt
-            system_prompt = """You are the OncoLife Symptom & Triage Assistant, a medical chatbot that performs both symptom assessment and clinical triage for chemotherapy patients. Your task is to guide users through structured symptom reporting and decide whether any responses require escalation to their care team.
-
-Follow this workflow:
-1. Ask for symptoms if none provided
-2. For each symptom, ask severity rating (mild/moderate/severe)
-3. Check for red flags and immediate escalation needs
-4. Grade severity using CTCAE or UKONS criteria
-5. Ask targeted questions based on utility scoring
-6. Provide structured summary with triage recommendations
-
-Safety protocols:
-- Never provide medical advice or treatment recommendations
-- Always redirect to oncology team for medical decisions
-- Escalate immediately for dangerous symptoms
-- Add legal disclaimer at session end
-
-Current conversation state: {conversation_state}"""
-
-            # Format conversation history
-            history_text = ""
-            if conversation_history:
-                for entry in conversation_history:
-                    history_text += f"User: {entry['user']}\nAssistant: {entry['assistant']}\n\n"
-
-            # Create full prompt
-            prompt = f"{system_prompt}\n\nConversation History:\n{history_text}\nUser: {user_input}\nAssistant:"
-
-            # Tokenize
-            inputs = self.tokenizer(prompt, return_tensors="pt", padding=True)
-
-            # Get the device the model is actually on
-            model_device = next(self.model.parameters()).device
-            print(f"🔧 Model device: {model_device}")
-
-            # Move inputs to the same device as the model
-            for key in inputs:
-                if isinstance(inputs[key], torch.Tensor):
-                    inputs[key] = inputs[key].to(model_device)
-                    print(f"📦 Moved {key} to {model_device}")
-
-            # Ensure model is in eval mode
-            self.model.eval()
-
-            # Generate with proper device handling
-            with torch.no_grad():
-                try:
-                    outputs = self.model.generate(
-                        **inputs,
-                        max_new_tokens=512,  # Longer responses for detailed medical assessment
-                        temperature=0.7,
-                        do_sample=True,
-                        top_p=0.9,
-                        pad_token_id=self.tokenizer.eos_token_id,
-                        eos_token_id=self.tokenizer.eos_token_id
-                    )
-                except RuntimeError as e:
-                    if "device" in str(e).lower():
-                        print("🔄 Device error detected, trying CPU fallback...")
-                        # Move everything to CPU and try again
-                        self.model = self.model.to("cpu")
-                        for key in inputs:
-                            if isinstance(inputs[key], torch.Tensor):
-                                inputs[key] = inputs[key].to("cpu")
-
-                        outputs = self.model.generate(
-                            **inputs,
-                            max_new_tokens=512,
-                            temperature=0.7,
-                            do_sample=True,
-                            top_p=0.9,
-                            pad_token_id=self.tokenizer.eos_token_id,
-                            eos_token_id=self.tokenizer.eos_token_id
-                        )
-                    else:
-                        raise e
-
-            # Decode response
-            response = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
-
-            # Extract just the assistant's response
-            if "Assistant:" in response:
-                answer = response.split("Assistant:")[-1].strip()
-            else:
-                answer = response.strip()
-
-            # Add legal disclaimer if this appears to be end of session
-            if any(keyword in user_input.lower() for keyword in ['done', 'finished', 'complete', 'summary']):
-                answer += "\n\n" + self._get_legal_disclaimer()
-
-            print("✅ OncoLife response generated successfully")
-            return answer
-
-        except Exception as e:
-            print(f"❌ Error generating OncoLife response: {e}")
-            return f"""❌ **Generation Error**
-
-Error: {str(e)}
-
-This could be due to:
-1. Model compatibility issues
-2. Memory constraints
-3. Input format problems
-
-Please try a simpler question or check the logs for more details."""
-
-    def _get_legal_disclaimer(self):
-        """Return the legal disclaimer as specified in the instructions"""
-        return """**Legal Disclaimer:**
-
-Patient verbalizes agreement with plan of care and understanding of the information we have gone over today and has no further comments, questions or concerns at this time. Will follow up with Doctor or ONN if symptoms worsen, do not improve, or any other symptoms develop. Agrees to seek emergency care if pt believes is needed, including for increased dizziness, depression, or any thoughts of SI.
-
-**Important:** I cannot provide medical advice or treatment recommendations. Please call your oncology team to confirm what's appropriate for your specific situation."""
-
-    def chat(self, message, history):
-        """Main chat interface for OncoLife Assistant"""
-        if not message.strip():
-            return "Please describe your symptoms or concerns."
-
-        # Convert history to the format expected by generate_oncolife_response
-        conversation_history = []
-        for user_msg, assistant_msg in history:
-            conversation_history.append({
-                "user": user_msg,
-                "assistant": assistant_msg
-            })
-
-        # Generate response using OncoLife protocol
-        response = self.generate_oncolife_response(message, conversation_history)
-
-        return response
-
-# Create interface
-assistant = OncoLifeAssistant()
-interface = gr.ChatInterface(
-    fn=assistant.chat,
-    title="🏥 OncoLife Symptom & Triage Assistant",
-    description="I'm here to help assess your symptoms and determine if you need to contact your care team. Please describe your symptoms or concerns.",
-    examples=[
-        ["I'm feeling nauseous and tired"],
-        ["I have a fever of 101"],
-        ["My neuropathy is getting worse"],
-        ["I'm having trouble eating"],
-        ["I feel dizzy and lightheaded"]
-    ],
-    theme=gr.themes.Soft()
-)
-
-if __name__ == "__main__":
-    print("=" * 60)
-    print("OncoLife Symptom & Triage Assistant")
-    print("=" * 60)
-    interface.launch(server_name="0.0.0.0", server_port=7860)