LETR / app.py
z-uo's picture
add raw text output
b4d55e3
raw
history blame
2.31 kB
from PIL import Image, ImageDraw
import torch
from torchvision import transforms
import torch.nn.functional as F
import gradio as gr
# import sys
# sys.path.insert(0, './')
from test import create_letr, get_lines_and_draw
from models.preprocessing import *
from models.misc import nested_tensor_from_tensor_list
model = create_letr('resnet50/checkpoint0024.pth')
model101 = create_letr('resnet101/checkpoint0024.pth')
# PREPARE PREPROCESSING
# transform_test = transforms.Compose([
# transforms.Resize((test_size)),
# transforms.ToTensor(),
# transforms.Normalize([0.538, 0.494, 0.453], [0.257, 0.263, 0.273]),
# ])
normalize = Compose([
ToTensor(),
Normalize([0.538, 0.494, 0.453], [0.257, 0.263, 0.273]),
Resize([256]),
])
normalize_512 = Compose([
ToTensor(),
Normalize([0.538, 0.494, 0.453], [0.257, 0.263, 0.273]),
Resize([512]),
])
normalize_1100 = Compose([
ToTensor(),
Normalize([0.538, 0.494, 0.453], [0.257, 0.263, 0.273]),
Resize([1100]),
])
def predict(inp, size, model_name):
image = Image.fromarray(inp.astype('uint8'), 'RGB')
h, w = image.height, image.width
orig_size = torch.as_tensor([int(h), int(w)])
if size == '1100':
img = normalize_1100(image)
elif size == '512':
img = normalize_512(image)
else:
img = normalize(image)
inputs = nested_tensor_from_tensor_list([img])
with torch.no_grad():
if model_name == 'resnet101':
outputs = model101(inputs)[0]
else:
outputs = model(inputs)[0]
lines = get_lines_and_draw(image, outputs, orig_size)
return image, str(lines)
inputs = [
gr.inputs.Image(),
gr.inputs.Radio(["256", "512", "1100"]),
gr.inputs.Radio(["resnet50", "resnet101"]),
]
outputs = [
gr.outputs.Image(),
gr.outputs.Textbox()
]
gr.Interface(
fn=predict,
inputs=inputs,
outputs=outputs,
examples=[
["demo.png", '256', "resnet50"],
["tappeto-per-calibrazione.jpg", '256', "resnet50"]
],
title="LETR: Line Segment Detection Using Transformers without Edges",
description="It is an end-to-end line segment detection algorithm using Transformers [published on CVPR 2021](https://github.com/mlpc-ucsd/LETR)."
).launch()