Spaces:

0llheaven
/

FT_Llama

Runtime error

App Files Files Community

0llheaven committed on Dec 4, 2024

Commit

ddfe551

verified ·

1 Parent(s): 0a05d96

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -6

app.py CHANGED Viewed

@@ -1,15 +1,16 @@
 import gradio as gr
 import torch
 from PIL import Image
-from transformers import MllamaForConditionalGeneration, AutoProcessor
 from transformers import TextStreamer
 from torchvision.transforms import Resize
 # Define the model and processor
 model_id = "0llheaven/Llama-3.2-11B-Vision-Radiology-mini"
 # device = "cuda" if torch.cuda.is_available() else "cpu"
-model = MllamaForConditionalGeneration.from_pretrained(
     model_id,
     # load_in_4bit=True,
     torch_dtype=torch.bfloat16,
@@ -20,6 +21,14 @@ model.gradient_checkpointing_enable()
 processor = AutoProcessor.from_pretrained(model_id)
 # Function to process the image and generate the description
 def generate_description(image: Image.Image, instruction: str):
     image = image.convert("RGB")
@@ -34,8 +43,9 @@ def generate_description(image: Image.Image, instruction: str):
         ]}
     ]
-    input_text = processor.apply_chat_template(messages, add_generation_prompt=True)
-    inputs = processor(
         image,
         input_text,
         add_special_tokens=False,
@@ -43,8 +53,17 @@ def generate_description(image: Image.Image, instruction: str):
     ).to(model.device)
     # Generate the output from the model
-    output = model.generate(**inputs, max_new_tokens=256)
-    return processor.decode(output[0])
 # Define Gradio interface
 interface = gr.Interface(

 import gradio as gr
 import torch
 from PIL import Image
+from transformers import AutoModelForImageTextToText, MllamaForConditionalGeneration, AutoProcessor
 from transformers import TextStreamer
 from torchvision.transforms import Resize
+from unsloth import FastVisionModel
 # Define the model and processor
 model_id = "0llheaven/Llama-3.2-11B-Vision-Radiology-mini"
 # device = "cuda" if torch.cuda.is_available() else "cpu"
+model = AutoModelForImageTextToText.from_pretrained(
     model_id,
     # load_in_4bit=True,
     torch_dtype=torch.bfloat16,
 processor = AutoProcessor.from_pretrained(model_id)
+FastVisionModel.for_inference(model)
+print("กำลังโหลด tokenizer...")
+base_model, tokenizer = FastVisionModel.from_pretrained(
+    "unsloth/Llama-3.2-11B-Vision-Instruct",
+    # load_in_4bit = True,
+    use_gradient_checkpointing = "unsloth",
+)
 # Function to process the image and generate the description
 def generate_description(image: Image.Image, instruction: str):
     image = image.convert("RGB")
         ]}
     ]
+    input_text = tokenizer.apply_chat_template(messages, add_generation_prompt=True)
+    # input_text = processor.apply_chat_template(messages, add_generation_prompt=True)
+    inputs = tokenizer(
         image,
         input_text,
         add_special_tokens=False,
     ).to(model.device)
     # Generate the output from the model
+    # output = model.generate(**inputs, max_new_tokens=256)
+    text_streamer = TextStreamer(tokenizer, skip_prompt=True)
+    outputs = model.generate(
+            **inputs,
+            streamer=text_streamer,
+            max_new_tokens=256,
+            use_cache=True,
+            temperature=1.5,
+            min_p=0.1
+        )
+    return tokenizer.decode(outputs[0], skip_special_tokens=True).strip()
 # Define Gradio interface
 interface = gr.Interface(