Spaces:
Runtime error
Runtime error
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from __future__ import absolute_import | |
from __future__ import division | |
from __future__ import print_function | |
import numpy as np | |
import os | |
import sys | |
__dir__ = os.path.dirname(os.path.abspath(__file__)) | |
sys.path.append(__dir__) | |
sys.path.insert(0, os.path.abspath(os.path.join(__dir__, '..'))) | |
os.environ["FLAGS_allocator_strategy"] = 'auto_growth' | |
import cv2 | |
import json | |
import paddle | |
from ppocr.data import create_operators, transform | |
from ppocr.modeling.architectures import build_model | |
from ppocr.postprocess import build_post_process | |
from ppocr.utils.save_load import load_model | |
from ppocr.utils.utility import get_image_file_list | |
import tools.program as program | |
from PIL import Image, ImageDraw, ImageFont | |
import math | |
def draw_e2e_res_for_chinese(image,
                             boxes,
                             txts,
                             config,
                             img_name,
                             font_path="./doc/simfang.ttf"):
    """Render end-to-end OCR results side by side and write them to disk.

    The output canvas is twice as wide as ``image``. Its left half is
    ``image`` blended 50/50 with a copy on which every polygon is filled
    with a pseudo-random colour. Its right half is a white canvas carrying
    the polygon outlines (same colours) and each text drawn in black at the
    polygon's first vertex.

    The result is saved as
    ``<dirname(config['Global']['save_res_path'])>/e2e_results/<basename(img_name)>``.

    Args:
        image: PIL image; ``height``, ``width`` and ``copy()`` are used.
        boxes: Iterable of polygons. Each one is passed through ``np.array``
            and its rows are used as vertices.
        txts: Texts, paired with ``boxes`` through ``zip`` (extra items on
            either side are ignored).
        config: Mapping providing ``config['Global']['save_res_path']``.
        img_name: Source image path; only its basename is used.
        font_path: Font file handed to ``ImageFont.truetype``.

    Note:
        Uses the module-level ``logger``, which is bound in the
        ``__main__`` guard of this script.
    """
    import random

    h, w = image.height, image.width
    img_left = image.copy()
    img_right = Image.new('RGB', (w, h), (255, 255, 255))
    draw_left = ImageDraw.Draw(img_left)
    draw_right = ImageDraw.Draw(img_right)

    # A private generator seeded with 0 yields the same colour sequence as
    # random.seed(0) on the module-level generator, without reseeding the
    # RNG that the rest of the process shares.
    rng = random.Random(0)
    # The font is loaded once, on first use, instead of once per box. It is
    # still not loaded at all when there is nothing to draw.
    font = None
    for box, txt in zip(boxes, txts):
        vertices = [tuple(pt) for pt in np.array(box)]
        color = (rng.randint(0, 255), rng.randint(0, 255),
                 rng.randint(0, 255))
        draw_left.polygon(vertices, fill=color)
        draw_right.polygon(vertices, outline=color)
        if font is None:
            font = ImageFont.truetype(font_path, 15, encoding="utf-8")
        draw_right.text(
            [vertices[0][0], vertices[0][1]], txt, fill=(0, 0, 0), font=font)

    img_left = Image.blend(image, img_left, 0.5)
    img_show = Image.new('RGB', (w * 2, h), (255, 255, 255))
    img_show.paste(img_left, (0, 0, w, h))
    img_show.paste(img_right, (w, 0, w * 2, h))

    # os.path.join keeps the directory relative when save_res_path has no
    # directory component; plain concatenation produced "/e2e_results/".
    save_e2e_path = os.path.join(
        os.path.dirname(config['Global']['save_res_path']), "e2e_results")
    os.makedirs(save_e2e_path, exist_ok=True)
    save_path = os.path.join(save_e2e_path, os.path.basename(img_name))
    # Reverse the channel axis (RGB -> BGR) before handing the array to OpenCV.
    cv2.imwrite(save_path, np.array(img_show)[:, :, ::-1])
    logger.info("The e2e Image saved in {}".format(save_path))
def draw_e2e_res(dt_boxes, strs, config, img, img_name):
    """Draw detected polygons and their texts onto ``img`` and save it.

    Nothing is drawn or written when ``dt_boxes`` is empty. Otherwise each
    polygon is outlined and its text is put at the polygon's first point.
    The drawing calls receive ``img`` itself (no copy is made). The result
    is written to
    ``<dirname(config['Global']['save_res_path'])>/e2e_results/<basename(img_name)>``.

    Args:
        dt_boxes: Sequence of polygons; each must support
            ``astype(np.int32).reshape((-1, 1, 2))``.
        strs: Texts, paired with ``dt_boxes`` through ``zip``.
        config: Mapping providing ``config['Global']['save_res_path']``.
        img: Image passed to ``cv2.polylines`` / ``cv2.putText`` and then to
            ``cv2.imwrite``.
        img_name: Source image path; only its basename is used.

    Note:
        Uses the module-level ``logger``, which is bound in the
        ``__main__`` guard of this script.
    """
    # len() rather than truthiness: dt_boxes may be an array-like whose
    # truth value is ambiguous.
    if len(dt_boxes) == 0:
        return

    for box, text in zip(dt_boxes, strs):
        box = box.astype(np.int32).reshape((-1, 1, 2))
        cv2.polylines(img, [box], True, color=(255, 255, 0), thickness=2)
        cv2.putText(
            img,
            text,
            org=(int(box[0, 0, 0]), int(box[0, 0, 1])),
            fontFace=cv2.FONT_HERSHEY_COMPLEX,
            fontScale=0.7,
            color=(0, 255, 0),
            thickness=1)

    # os.path.join keeps the directory relative when save_res_path has no
    # directory component; plain concatenation produced "/e2e_results/".
    save_det_path = os.path.join(
        os.path.dirname(config['Global']['save_res_path']), "e2e_results")
    os.makedirs(save_det_path, exist_ok=True)
    save_path = os.path.join(save_det_path, os.path.basename(img_name))
    cv2.imwrite(save_path, img)
    logger.info("The e2e Image saved in {}".format(save_path))
def main():
    """Run end-to-end OCR inference over the configured images.

    Builds the model and post-processor from the module-level ``config``,
    runs every file returned by ``get_image_file_list`` through the model,
    appends one ``<path>\\t<json>\\n`` line per image to
    ``config['Global']['save_res_path']`` and, depending on
    ``config['Global']['infer_visual_type']`` (``'EN'`` or ``'CN'``), saves a
    visualisation through ``draw_e2e_res`` or ``draw_e2e_res_for_chinese``.

    Note:
        Reads the module-level ``config`` and ``logger``, which are bound in
        the ``__main__`` guard of this script.
    """
    global_config = config['Global']

    # build model
    model = build_model(config['Architecture'])
    load_model(config, model)

    # build post process
    post_process_class = build_post_process(config['PostProcess'],
                                            global_config)

    # create data ops: drop label-related ops and keep only image + shape
    transforms = []
    for op in config['Eval']['dataset']['transforms']:
        op_name = list(op)[0]
        if 'Label' in op_name:
            continue
        elif op_name == 'KeepKeys':
            op[op_name]['keep_keys'] = ['image', 'shape']
        transforms.append(op)
    ops = create_operators(transforms, global_config)

    save_res_path = global_config['save_res_path']
    save_res_dir = os.path.dirname(save_res_path)
    # dirname is "" for a bare filename; os.makedirs("") would raise, and the
    # current directory needs no creation anyway.
    if save_res_dir:
        os.makedirs(save_res_dir, exist_ok=True)

    model.eval()
    with open(save_res_path, "wb") as fout:
        for img_path in get_image_file_list(global_config['infer_img']):
            logger.info("infer_img: {}".format(img_path))
            with open(img_path, 'rb') as f:
                img = f.read()
            data = {'image': img}
            batch = transform(data, ops)

            # Add a leading batch axis of size 1 to the image and its shape.
            images = np.expand_dims(batch[0], axis=0)
            shape_list = np.expand_dims(batch[1], axis=0)
            images = paddle.to_tensor(images)
            preds = model(images)
            post_result = post_process_class(preds, shape_list)
            points, strs = post_result['points'], post_result['texts']

            # write result
            dt_boxes_json = [{
                "transcription": text,
                "points": poly.tolist()
            } for poly, text in zip(points, strs)]
            otstr = img_path + "\t" + json.dumps(dt_boxes_json) + "\n"
            fout.write(otstr.encode())

            src_img = cv2.imread(img_path)
            if src_img is None:
                # cv2.imread reports failure by returning None instead of
                # raising; skip only the visualisation, the text result
                # above has already been written.
                logger.warning(
                    "cv2.imread could not load {}, skip visualization".format(
                        img_path))
                continue

            if global_config['infer_visual_type'] == 'EN':
                draw_e2e_res(points, strs, config, src_img, img_path)
            elif global_config['infer_visual_type'] == 'CN':
                src_img = Image.fromarray(
                    cv2.cvtColor(src_img, cv2.COLOR_BGR2RGB))
                draw_e2e_res_for_chinese(
                    src_img,
                    points,
                    strs,
                    config,
                    img_path,
                    font_path="./doc/fonts/simfang.ttf")

    logger.info("success!")
if __name__ == '__main__':
    # main() and the drawing helpers look up `config` and `logger` as module
    # globals, so they must be bound under exactly these names before main()
    # is called.
    preprocess_outputs = program.preprocess()
    config, device, logger, vdl_writer = preprocess_outputs
    main()