Spaces:
Running
Running
File size: 1,961 Bytes
d863531 b6a4ee3 d863531 b6a4ee3 d863531 b6a4ee3 d863531 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 |
from PIL import Image, ImageDraw
import torch.nn.functional as F
import torch
from models.letr import build
from models.misc import nested_tensor_from_tensor_list
from models.preprocessing import Compose, ToTensor, Resize, Normalize
def create_letr(path):
    """Build a LETR model on the CPU and restore its weights from a checkpoint.

    Args:
        path: Location of a checkpoint readable by ``torch.load``. The loaded
            object must provide an ``'args'`` entry (the configuration handed
            to ``build``) and a ``'model'`` entry (the state dict).

    Returns:
        The first value returned by ``build``, with the checkpoint weights
        loaded and switched to evaluation mode.
    """
    # Deserialize onto the CPU regardless of where the checkpoint was saved.
    # NOTE(review): torch.load unpickles the file -- only load checkpoints
    # from a trusted source.
    ckpt = torch.load(path, map_location='cpu')

    # Reuse the configuration stored in the checkpoint, forcing the CPU device.
    config = ckpt['args']
    config.device = 'cpu'

    # build() returns three values; only the first one is needed here.
    net, _, _ = build(config)
    net.load_state_dict(ckpt['model'])
    net.eval()
    return net
def draw_fig(image, outputs, orig_size, threshold=0.7, fill=500):
    """Draw the confidently predicted line segments onto ``image`` in place.

    Args:
        image: PIL image to draw on; it is modified in place.
        outputs: Mapping with ``'pred_logits'`` and ``'pred_lines'`` tensors.
            Assumed to describe a single image, with each line stored as
            ``(x1, y1, x2, y2)`` relative to the image size and the last
            logit being the "no line" class -- TODO confirm against the model.
        orig_size: Tensor holding ``(height, width)`` of ``image`` in pixels.
        threshold: Minimum score a prediction needs in order to be drawn.
        fill: Colour value forwarded to ``ImageDraw.line``; the default is the
            value the script has always used.

    Returns:
        None. The result is the side effect on ``image``.
    """
    logits, pred_lines = outputs['pred_logits'], outputs['pred_lines']

    # Score of a prediction = best probability over every class but the last.
    scores, _ = F.softmax(logits, -1)[..., :-1].max(-1)

    # Scale the relative coordinates up to pixel coordinates.
    img_h, img_w = orig_size.unbind(0)
    scale = torch.stack([img_w, img_h, img_w, img_h], dim=0)

    # One row of four coordinates per prediction. reshape(-1, ...) avoids
    # hard-coding the number of predictions the model emits, and also behaves
    # when there is exactly one prediction (where squeeze() would yield a
    # 0-d mask).
    segments = (pred_lines * scale).reshape(-1, 4)
    keep = scores.reshape(-1) >= threshold

    # Hand PIL plain Python floats rather than 0-d tensors.
    draw = ImageDraw.Draw(image)
    for x1, y1, x2, y2 in segments[keep].detach().tolist():
        draw.line((x1, y1, x2, y2), fill=fill)
if __name__ == '__main__':
    # Demo entry point: run LETR on demo.png and save the annotated image.
    letr = create_letr('resnet50/checkpoint0024.pth')

    # Preprocessing pipeline applied to the input picture before inference.
    target_size = 256
    preprocess = Compose([
        ToTensor(),
        Normalize([0.538, 0.494, 0.453], [0.257, 0.263, 0.273]),
        Resize([target_size]),
    ])

    image = Image.open('demo.png')
    # (height, width) of the untouched picture, used later to scale the lines.
    orig_size = torch.as_tensor([int(image.height), int(image.width)])

    batch = nested_tensor_from_tensor_list([preprocess(image)])

    # Inference only: no gradients are needed.
    with torch.no_grad():
        outputs = letr(batch)[0]

    # draw_fig paints directly onto `image`, which is then written to disk.
    draw_fig(image, outputs, orig_size)
    image.save('output.png')