mashaelalbu commited on
Commit
c7898d4
·
verified ·
1 Parent(s): 6587984

Update app/utils.py

Browse files
Files changed (1) hide show
  1. app/utils.py +13 -14
app/utils.py CHANGED
@@ -4,9 +4,7 @@ from transformers import AutoModel, AutoTokenizer
4
  from PIL import Image, ImageEnhance, ImageFilter
5
  import torch
6
  import logging
7
- import shutil
8
- import os
9
-
10
 
11
  logger = logging.getLogger(__name__)
12
 
@@ -22,19 +20,21 @@ class OCRModel:
22
  def initialize(self):
23
  try:
24
  logger.info("Initializing OCR model...")
25
- # Try loading with use_fast=False if the fast tokenizer fails
 
26
  try:
 
27
  self.tokenizer = AutoTokenizer.from_pretrained(
28
- 'stepfun-ai/GOT-OCR-2.0-hf',
29
  trust_remote_code=True,
30
- use_fast=False # Try with slow tokenizer
31
  )
32
  except Exception as e:
33
- logger.warning(f"Fast tokenizer failed, trying alternative: {str(e)}")
34
- self.tokenizer = AutoTokenizer.from_pretrained(
35
- 'stepfun-ai/GOT-OCR-2.0-hf',
36
- trust_remote_code=True,
37
- use_fast=False
38
  )
39
 
40
  self.model = AutoModel.from_pretrained(
@@ -42,8 +42,7 @@ class OCRModel:
42
  trust_remote_code=True,
43
  low_cpu_mem_usage=True,
44
  device_map='auto',
45
- use_safetensors=True,
46
- pad_token_id=self.tokenizer.eos_token_id
47
  )
48
 
49
  self.device = "cuda" if torch.cuda.is_available() else "cpu"
@@ -54,7 +53,7 @@ class OCRModel:
54
  except Exception as e:
55
  logger.error(f"Error initializing model: {str(e)}", exc_info=True)
56
  raise
57
-
58
  def preprocess_image(self, image):
59
  """Image preprocessing to improve text recognition quality"""
60
  try:
 
4
  from PIL import Image, ImageEnhance, ImageFilter
5
  import torch
6
  import logging
7
+ from transformers import BertTokenizer
 
 
8
 
9
  logger = logging.getLogger(__name__)
10
 
 
20
  def initialize(self):
21
  try:
22
  logger.info("Initializing OCR model...")
23
+
24
+ # Try different tokenizer approaches
25
  try:
26
+ # First try with the standard approach
27
  self.tokenizer = AutoTokenizer.from_pretrained(
28
+ 'stepfun-ai/GOT-OCR-2.0-hf',
29
  trust_remote_code=True,
30
+ use_fast=False
31
  )
32
  except Exception as e:
33
+ logger.warning(f"Standard tokenizer failed, trying BertTokenizer: {str(e)}")
34
+ # Fall back to BertTokenizer if AutoTokenizer fails
35
+ self.tokenizer = BertTokenizer.from_pretrained(
36
+ 'stepfun-ai/GOT-OCR-2.0-hf',
37
+ trust_remote_code=True
38
  )
39
 
40
  self.model = AutoModel.from_pretrained(
 
42
  trust_remote_code=True,
43
  low_cpu_mem_usage=True,
44
  device_map='auto',
45
+ use_safetensors=True
 
46
  )
47
 
48
  self.device = "cuda" if torch.cuda.is_available() else "cpu"
 
53
  except Exception as e:
54
  logger.error(f"Error initializing model: {str(e)}", exc_info=True)
55
  raise
56
+
57
  def preprocess_image(self, image):
58
  """Image preprocessing to improve text recognition quality"""
59
  try: