Update app.py
Browse files
app.py
CHANGED
@@ -1,63 +1,75 @@
|
|
1 |
import gradio as gr
|
2 |
import torch
|
3 |
-
from
|
4 |
-
import
|
5 |
|
6 |
-
#
|
7 |
-
|
|
|
|
|
|
|
|
|
|
|
8 |
|
9 |
-
#
|
10 |
-
|
11 |
-
|
12 |
-
|
13 |
-
# Define variables for the model and tokenizer
|
14 |
-
model = None
|
15 |
-
tokenizer = None
|
16 |
-
|
17 |
-
def load_model(model_name):
|
18 |
-
global model, tokenizer
|
19 |
-
device = "cuda" if torch.cuda.is_available() else "cpu"
|
20 |
-
|
21 |
-
# Clear previous model from memory
|
22 |
-
if model:
|
23 |
-
del model
|
24 |
-
torch.cuda.empty_cache()
|
25 |
-
|
26 |
-
try:
|
27 |
-
# Load the specified model and move it to the device
|
28 |
-
model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.float16).to(device)
|
29 |
-
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
30 |
-
print(f"Loaded model: {model_name}")
|
31 |
-
except ValueError as e:
|
32 |
-
print(f"Failed to load model '{model_name}': {e}")
|
33 |
-
model = None # Reset if loading fails
|
34 |
-
tokenizer = None
|
35 |
-
|
36 |
-
# Load the initial model
|
37 |
-
current_model_name = model_list[0]
|
38 |
-
load_model(current_model_name)
|
39 |
|
40 |
# Default values for system and user input
|
41 |
-
test_instruction_string = """
|
42 |
-
|
43 |
-
|
44 |
-
|
45 |
-
|
46 |
-
|
47 |
-
|
48 |
-
|
49 |
-
|
50 |
-
|
51 |
-
|
52 |
-
|
53 |
-
|
54 |
-
|
55 |
-
|
56 |
-
|
|
|
57 |
|
58 |
-
|
59 |
-
|
60 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
61 |
|
62 |
# Define generation configuration
|
63 |
meta_config = {
|
@@ -70,7 +82,7 @@ def generate_response(system_instruction, user_input):
|
|
70 |
}
|
71 |
generation_config = GenerationConfig(**meta_config)
|
72 |
|
73 |
-
# Generate response
|
74 |
with torch.no_grad():
|
75 |
outputs = model.generate(**inputs, generation_config=generation_config)
|
76 |
decoded_output = tokenizer.batch_decode(outputs, skip_special_tokens=True)[0]
|
@@ -78,12 +90,12 @@ def generate_response(system_instruction, user_input):
|
|
78 |
|
79 |
return assistant_response
|
80 |
|
81 |
-
|
82 |
# Gradio interface setup
|
83 |
with gr.Blocks() as demo:
|
84 |
-
gr.Markdown("# Clinical Trial Chatbot
|
85 |
|
86 |
with gr.Row():
|
|
|
87 |
with gr.Column():
|
88 |
system_instruction = gr.Textbox(
|
89 |
value=test_instruction_string,
|
@@ -97,15 +109,14 @@ with gr.Blocks() as demo:
|
|
97 |
)
|
98 |
submit_btn = gr.Button("Submit")
|
99 |
|
|
|
100 |
with gr.Column():
|
101 |
-
model_dropdown = gr.Dropdown(choices=model_list, value=current_model_name, label="Select Model")
|
102 |
response_display = gr.Textbox(
|
103 |
label="Bot Response", interactive=False, placeholder="Response will appear here."
|
104 |
)
|
105 |
|
106 |
-
# Link
|
107 |
-
model_dropdown.change(lambda m: load_model(m), inputs=model_dropdown, outputs=[])
|
108 |
submit_btn.click(generate_response, [system_instruction, user_input], response_display)
|
109 |
|
110 |
# Launch the app with share=True to make it public
|
111 |
-
demo.launch(
|
|
|
1 |
import gradio as gr
|
2 |
import torch
|
3 |
+
from peft import AutoPeftModelForCausalLM
|
4 |
+
from transformers import AutoTokenizer, GenerationConfig
|
5 |
|
6 |
+
# Load model and tokenizer
|
7 |
+
model_name = "nafisneehal/Llama-3.2-3B-bnb-4bit-finetuned-TrialBrain-BaselineFeatures-it"
|
8 |
+
load_in_4bit = True # Set this to True as per your code requirements
|
9 |
+
|
10 |
+
# Initialize model and tokenizer
|
11 |
+
model = AutoPeftModelForCausalLM.from_pretrained(model_name, load_in_4bit=load_in_4bit)
|
12 |
+
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
13 |
|
14 |
+
# Set device
|
15 |
+
device = "cuda" if torch.cuda.is_available() else "cpu"
|
16 |
+
model.to(device)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|

# Default values for system and user input (pre-filled into the Gradio
# textboxes so the demo is runnable without typing anything).

# System prompt: frames the model as a clinical-trial expert and fixes the
# required output format (backtick-quoted, comma-separated baseline features).
test_instruction_string = """
You're a clinical trial expert. For each trial query, list probable baseline features (each in backticks and comma-separated).
Baseline features are demographic characteristics used in primary outcome analysis, often shown by group in clinical publications.
"""

# Example user input: one full clinical-trial record in the tagged format the
# fine-tuned model was trained on (<Title:>, <BriefSummary:>,
# <EligibilityCriteria:>, <Conditions:>, <Interventions:>, <StudyType:>,
# <PrimaryOutcomes:>, <OverallStatus:>). The `\<` / `\>` escapes are part of
# the source data and are preserved verbatim.
test_input_string = """
<Title:>Vinorelbine in Treating Patients With Advanced Solid Tumors That Have Not Responded to Treatment and Liver Dysfunction <BriefSummary:>RATIONALE: Drugs used in chemotherapy, such as vinorelbine, work in different ways to stop the growth of tumor cells, either by killing the cells or by stopping them from dividing.

PURPOSE: This pilot trial is studying the side effects and best dose of vinorelbine in treating patients with advanced solid tumors that have not responded to treatment and liver dysfunction. <EligibilityCriteria:>DISEASE CHARACTERISTICS:

* Histologically confirmed advanced solid tumor

* Any histology allowed
* Refractory to standard therapy OR no standard therapy exists

* Previously untreated non-small cell lung cancer allowed, provided abnormal liver function is present, defined as moderate (group 3) or severe (group 4)
* Measurable disease not required

* Present measurable disease requires baseline measurements within 4 weeks of study entry
* Patients with acute hepatitis from viral or drug etiologies should recover to a stable baseline prior to study therapy
* History of brain metastasis allowed, provided the following criteria are met:

* Metastasis has been controlled by radiotherapy or surgery
* Patient is not currently on corticosteroids
* Neurologic status is stable

PATIENT CHARACTERISTICS:

* Karnofsky performance status 70-100%
* Life expectancy ≥ 2 months
* ANC = 1,500/mm³
* Platelet count = 100,000/mm³
* Hemoglobin = 10 g/dL (transfusion to this level allowed)
* Creatinine \< 1.5 mg/dL OR creatinine clearance \> 60 mL/ min
* Patients with EKG evidence of first- or second-degree AV block or left or right bundle branch block are ineligible for the lidocaine bolus, but may otherwise be treated on this protocol
* Not pregnant or nursing
* Negative pregnancy test
* Fertile patients must use effective contraception
* No concurrent illness (e.g., cardiovascular, pulmonary, or central nervous system) that is poorly controlled or of such severity that the investigator deems unwise to enter the patient on protocol
* Must have ability to comply with study treatment and required tests
* Obstructive jaundice requires a drainage procedure prior to study treatment

PRIOR CONCURRENT THERAPY:

* See Disease Characteristics
* Recovered from prior therapy
* At least 3 weeks since prior chemotherapy (6 weeks for mitomycin or nitrosourea therapy)
* No prior radiotherapy to \> 30% of the bone marrow or more than standard adjuvant pelvic radiotherapy for rectal cancer <Conditions:>Lung Cancer, Unspecified Adult Solid Tumor, Protocol Specific, <Interventions:>indocyanine green, lidocaine, vinorelbine ditartrate, high performance liquid chromatography, intracellular fluorescence polarization analysis, liquid chromatography, mass spectrometry, pharmacological study <StudyType:>INTERVENTIONAL <PrimaryOutcomes:>Area Under the Curve, Number of Participants With Grade 3 and 4 Toxicities <OverallStatus:>COMPLETED
"""
|
68 |
+
|
69 |
+
# Function to generate response
|
70 |
+
def generate_response(system_instruction, user_input):
|
71 |
+
# Prepare the input and move it to the correct device
|
72 |
+
inputs = tokenizer([f"### Instruction:\n{system_instruction}\n### Input:\n{user_input}\n### Response:\n"], return_tensors="pt").to(device)
|
73 |
|
74 |
# Define generation configuration
|
75 |
meta_config = {
|
|
|
82 |
}
|
83 |
generation_config = GenerationConfig(**meta_config)
|
84 |
|
85 |
+
# Generate response
|
86 |
with torch.no_grad():
|
87 |
outputs = model.generate(**inputs, generation_config=generation_config)
|
88 |
decoded_output = tokenizer.batch_decode(outputs, skip_special_tokens=True)[0]
|
|
|
90 |
|
91 |
return assistant_response
|
92 |
|
|
|
93 |
# Gradio interface setup
|
94 |
with gr.Blocks() as demo:
|
95 |
+
gr.Markdown("# Clinical Trial Chatbot")
|
96 |
|
97 |
with gr.Row():
|
98 |
+
# Left column for user inputs
|
99 |
with gr.Column():
|
100 |
system_instruction = gr.Textbox(
|
101 |
value=test_instruction_string,
|
|
|
109 |
)
|
110 |
submit_btn = gr.Button("Submit")
|
111 |
|
112 |
+
# Right column for bot response
|
113 |
with gr.Column():
|
|
|
114 |
response_display = gr.Textbox(
|
115 |
label="Bot Response", interactive=False, placeholder="Response will appear here."
|
116 |
)
|
117 |
|
118 |
+
# Link submit button to the function
|
|
|
119 |
submit_btn.click(generate_response, [system_instruction, user_input], response_display)
|
120 |
|
121 |
# Launch the app with share=True to make it public
|
122 |
+
demo.launch()
|