Update handler.py
Browse files- handler.py +3 -3
handler.py
CHANGED
@@ -6,18 +6,18 @@ class ModelHandler:
|
|
6 |
def __init__(self):
|
7 |
# Load the model and tokenizer with appropriate weights
|
8 |
self.model = AutoModel.from_pretrained(
|
9 |
-
'
|
10 |
trust_remote_code=True,
|
11 |
attn_implementation='sdpa',
|
12 |
torch_dtype=torch.bfloat16
|
13 |
).eval().cuda()
|
14 |
|
15 |
-
self.tokenizer = AutoTokenizer.from_pretrained('
|
16 |
|
17 |
def preprocess(self, inputs):
|
18 |
# Preprocess image input
|
19 |
image = Image.open(inputs['image'].file).convert('RGB')
|
20 |
-
question = inputs.get("question", "
|
21 |
msgs = [{'role': 'user', 'content': [image, question]}]
|
22 |
return msgs
|
23 |
|
|
|
6 |
def __init__(self):
|
7 |
# Load the model and tokenizer with appropriate weights
|
8 |
self.model = AutoModel.from_pretrained(
|
9 |
+
'fredaddy/MiniCPM-V-2_6',
|
10 |
trust_remote_code=True,
|
11 |
attn_implementation='sdpa',
|
12 |
torch_dtype=torch.bfloat16
|
13 |
).eval().cuda()
|
14 |
|
15 |
+
self.tokenizer = AutoTokenizer.from_pretrained('fredaddy/MiniCPM-V-2_6', trust_remote_code=True)
|
16 |
|
17 |
def preprocess(self, inputs):
|
18 |
# Preprocess image input
|
19 |
image = Image.open(inputs['image'].file).convert('RGB')
|
20 |
+
question = inputs.get("question", "Extract all data in the image. Be extremely careful to ensure that you don't miss anything. It's imperative that you extract and digitize everything on that page.")
|
21 |
msgs = [{'role': 'user', 'content': [image, question]}]
|
22 |
return msgs
|
23 |
|