0llheaven committed · verified
Commit bd9df5d · 1 Parent(s): b250b49

Update app.py

Files changed (1)
  1. app.py +114 -68
app.py CHANGED
@@ -1,87 +1,133 @@
-import spaces
-import gradio as gr
+import os
+from unsloth import FastVisionModel
 import torch
 from PIL import Image
-from transformers import AutoModelForImageTextToText, MllamaForConditionalGeneration, AutoProcessor
+from datasets import load_dataset
 from transformers import TextStreamer
-from torchvision.transforms import Resize
-from unsloth import FastVisionModel
 
-# Define the model and processor
-model_id = "0llheaven/Llama-3.2-11B-Vision-Radiology-mini"
+import matplotlib.pyplot as plt
 
-device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-print(f"Using device: {device}")
-
-# device = "cuda" if torch.cuda.is_available() else "cpu"
-model = AutoModelForImageTextToText.from_pretrained(
-    model_id,
-    # load_in_4bit=True,
-    torch_dtype=torch.float32 if device.type == "cpu" else torch.bfloat16,
-    device_map=device,
-).to(device)
-
-# if device.type == "cuda":
-#     model.gradient_checkpointing_enable()
-model.gradient_checkpointing_enable()
-
-processor = AutoProcessor.from_pretrained(model_id)
-
-# @spaces.GPU(duration=120)
-# Function to process the image and generate the description
-def generate_description(image: Image.Image, instruction: str):
-
-    FastVisionModel.for_inference(model)
-    print("Loading tokenizer...")
-    base_model, tokenizer = FastVisionModel.from_pretrained(
-        "unsloth/Llama-3.2-11B-Vision-Instruct",
-        # load_in_4bit = True,
-        use_gradient_checkpointing = "unsloth",
-    )
-
-    image = image.convert("RGB")
-    # image = Resize((224, 224))(image)
-
-    # Create the message to pass to the model
-    instruction = "You are an expert radiographer. Describe accurately what you see in this image."
-    messages = [
-        {"role": "user", "content": [
+import gradio as gr
+
+# Load the model
+model, tokenizer = FastVisionModel.from_pretrained(
+    "0llheaven/Llama-3.2-11B-Vision-Radiology-mini",
+    load_in_4bit=True,
+    use_gradient_checkpointing="unsloth",
+)
+
+# Switch the model into inference mode
+FastVisionModel.for_inference(model)
+
+# Cache variables
+cached_image = None
+cached_response = None
+
+# Process the image and generate a description
+def predict_radiology_description(image, instruction):
+    global cached_image, cached_response
+
+    try:
+        current_image_tensor = torch.tensor(image.getdata())
+
+        # Check whether the image is the same as the previous one
+        if cached_image is not None and torch.equal(cached_image, current_image_tensor):
+            # Reuse the cached response
+            return cached_response
+
+        # Build the message in the format the model expects
+        messages = [{"role": "user", "content": [
             {"type": "image"},
             {"type": "text", "text": instruction}
-        ]}
-    ]
-
-    input_text = tokenizer.apply_chat_template(messages, add_generation_prompt=True)
-    # input_text = processor.apply_chat_template(messages, add_generation_prompt=True)
-    inputs = tokenizer(
-        image,
-        input_text,
-        add_special_tokens=False,
-        return_tensors="pt"
-    ).to(device)
-
-    # Generate the output from the model
-    # output = model.generate(**inputs, max_new_tokens=256)
-    text_streamer = TextStreamer(tokenizer, skip_prompt=True)
-    outputs = model.generate(
-        **inputs,
+        ]}]
+        input_text = tokenizer.apply_chat_template(messages, add_generation_prompt=True)
+
+        # Prepare the inputs for the model
+        inputs = tokenizer(
+            image,
+            input_text,
+            add_special_tokens=False,
+            return_tensors="pt",
+        ).to("cuda")
+
+        # Stream tokens to stdout as they are generated
+        text_streamer = TextStreamer(tokenizer, skip_prompt=True)
+
+        # Generate the description
+        output_ids = model.generate(
+            **inputs,
            streamer=text_streamer,
            max_new_tokens=256,
            use_cache=True,
            temperature=1.5,
            min_p=0.1
        )
-    return tokenizer.decode(outputs[0], skip_special_tokens=True).strip()
-
-# Define Gradio interface
-interface = gr.Interface(
-    fn=generate_description,
-    inputs=gr.Image(type="pil", label="Upload an Image"),
-    outputs=gr.Textbox(label="Generated Description"),
-    # live=True,
-    title="Radiology Image Description Generator",
-    description="Upload an image and provide an instruction to generate a description using a vision-language model."
-)
-
-# Launch the interface
-interface.launch()
+
+        # Decode the generated tokens into text
+        generated_text = tokenizer.decode(output_ids[0], skip_special_tokens=True)
+
+        cached_image = current_image_tensor  # cache the image as a tensor
+        cached_response = generated_text.replace("assistant", "\n\nAssistant").strip()
+        return cached_response
+    except Exception as e:
+        return f"Error: {str(e)}"
+
+# ChatBot function
+def chat_process(image, instruction, history=None):
+    if history is None:
+        history = []
+
+    # Process the image and instruction
+    response = predict_radiology_description(image, instruction)
+
+    # Update the chat history
+    history.append((instruction, response))
+    return history, history
+
+import warnings
+warnings.filterwarnings("ignore", category=UserWarning, module="gradio.helpers")
+
+# Gradio UI
+with gr.Blocks() as demo:
+    gr.Markdown("# 🩻 Radiology Image ChatBot")
+    gr.Markdown("Upload a radiology image and provide an instruction for the AI to describe the findings.")
+    gr.Markdown("Example instruction: You are an expert radiographer. Describe accurately what you see in this image.")
+
+    with gr.Row():
+        with gr.Column():
+            # Image upload
+            image_input = gr.Image(type="pil", label="Upload Radiology Image")
+            # Instruction input
+            instruction_input = gr.Textbox(
+                label="Instruction",
+                value="You are an expert radiographer. Describe accurately what you see in this image.",
+                placeholder="Provide specific instructions..."
+            )
+        with gr.Column():
+            # Chat history display
+            chatbot = gr.Chatbot(label="Chat History")
+
+    with gr.Row():
+        clear_btn = gr.Button("Clear")
+        submit_btn = gr.Button("Submit")
+
+    # Submit: run the chat, keep the uploaded image, and clear only the instruction text
+    submit_btn.click(
+        lambda image, instruction, history: (
+            *chat_process(image, instruction, history),
+            image,  # keep the current image_input value
+            ""
+        ),
+        inputs=[image_input, instruction_input, chatbot],
+        outputs=[chatbot, chatbot, image_input, instruction_input]
+    )
+
+    # Clear: reset the chat history, image, and instruction
+    clear_btn.click(
+        lambda: (None, None, None, None),
+        inputs=[],
+        outputs=[chatbot, chatbot, image_input, instruction_input]
+    )
+
+    # Launch the app
+    demo.launch(debug=True)
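
For a quick smoke test outside the Gradio UI, the new predict_radiology_description function can be called directly. A minimal sketch, assuming the module-level model setup in app.py has already run in the same process (e.g. a notebook cell after executing the file), a CUDA-capable GPU with the unsloth dependencies installed, and a hypothetical local file sample_xray.png:

    # Hypothetical usage sketch; not part of the commit.
    from PIL import Image

    # Load a sample radiograph (hypothetical file name).
    image = Image.open("sample_xray.png").convert("RGB")
    instruction = ("You are an expert radiographer. "
                   "Describe accurately what you see in this image.")

    # First call runs generation; tokens also stream to stdout via TextStreamer.
    report = predict_radiology_description(image, instruction)
    print(report)

Note that the cache key is the image alone (torch.tensor(image.getdata())), so a second call with the same image returns the cached text even if the instruction changes.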