import copy
import os

from surya.detection import batch_text_detection
from surya.input.load import load_from_folder, load_from_file
from surya.layout import batch_layout_detection
from surya.model.detection.model import load_model as load_det_model, load_processor as load_det_processor
from surya.model.ordering.model import load_model
from surya.model.ordering.processor import load_processor
from surya.ordering import batch_ordering
from surya.postprocessing.heatmap import draw_polys_on_image
from surya.settings import settings


def main(input_path, max_pages=None):
    """Run text detection, layout detection and ordering, then draw the result.

    Loads the ordering, layout and text-detection models, reads the input
    images, and draws each page's ordered polygons (labelled with their
    ``position``) onto a deep copy of that page.

    Args:
        input_path: Path to a folder of inputs or to a single input file.
            A directory is loaded with ``load_from_folder``; anything else
            with ``load_from_file``.
        max_pages: Forwarded unchanged to the loader as its second argument.

    Returns:
        The value returned by ``draw_polys_on_image`` for the last page
        processed, or ``None`` when no pages were loaded.
    """
    # Ordering model, plus two detection-model instances: one loaded from the
    # layout checkpoint and one loaded with the loader's default checkpoint.
    model = load_model()
    processor = load_processor()
    layout_model = load_det_model(checkpoint=settings.LAYOUT_MODEL_CHECKPOINT)
    layout_processor = load_det_processor(checkpoint=settings.LAYOUT_MODEL_CHECKPOINT)
    det_model = load_det_model()
    det_processor = load_det_processor()

    if os.path.isdir(input_path):
        images, names = load_from_folder(input_path, max_pages)
    else:
        images, names = load_from_file(input_path, max_pages)

    line_predictions = batch_text_detection(images, det_model, det_processor)
    layout_predictions = batch_layout_detection(
        images, layout_model, layout_processor, line_predictions
    )

    # One list of layout boxes per page, in page order.
    bboxes = [
        [box.bbox for box in layout_pred.bboxes]
        for layout_pred in layout_predictions
    ]
    order_predictions = batch_ordering(images, bboxes, model, processor)

    # NOTE(review): the original indentation was lost, so it is unclear whether
    # the return sat inside or after this loop. It is assumed to follow the
    # loop (last page's image is returned) -- confirm against the caller.
    # Starting from None avoids an UnboundLocalError when there are no pages.
    bbox_image = None
    for image, order_pred in zip(images, order_predictions):
        polys = [box.polygon for box in order_pred.bboxes]
        labels = [str(box.position) for box in order_pred.bboxes]
        # Draw on a copy so the loaded image itself is left untouched.
        bbox_image = draw_polys_on_image(
            polys, copy.deepcopy(image), labels=labels, label_font_size=20
        )
    return bbox_image