Hunyuan3D-1 / svrm /utils /img_utils.py
Huiwenshi's picture
Upload folder using huggingface_hub
e3e5f9e verified
raw
history blame
7.43 kB
import os
import cv2
import numpy as np
from skimage.metrics import hausdorff_distance
from matplotlib import pyplot as plt
def get_input_imgs_path(input_data_dir):
path = {}
names = ['000', 'ori_000']
for name in names:
jpg_path = os.path.join(input_data_dir, f"{name}.jpg")
png_path = os.path.join(input_data_dir, f"{name}.png")
if os.path.exists(jpg_path):
path[name] = jpg_path
elif os.path.exists(png_path):
path[name] = png_path
return path
def rgba_to_rgb(image, bg_color=[255, 255, 255]):
if image.shape[-1] == 3: return image
rgba = image.astype(float)
rgb = rgba[:, :, :3].copy()
alpha = rgba[:, :, 3] / 255.0
bg = np.ones((image.shape[0], image.shape[1], 3), dtype=np.float32)
bg = bg * np.array(bg_color, dtype=np.float32)
rgb = rgb * alpha[:, :, np.newaxis] + bg * (1 - alpha[:, :, np.newaxis])
rgb = rgb.astype(np.uint8)
return rgb
def resize_with_aspect_ratio(image1, image2, pad_value=[255, 255, 255]):
aspect_ratio1 = float(image1.shape[1]) / float(image1.shape[0])
aspect_ratio2 = float(image2.shape[1]) / float(image2.shape[0])
top_pad, bottom_pad, left_pad, right_pad = 0, 0, 0, 0
if aspect_ratio1 < aspect_ratio2:
new_width = (aspect_ratio2 * image1.shape[0])
right_pad = left_pad = int((new_width - image1.shape[1]) / 2)
else:
new_height = (image1.shape[1] / aspect_ratio2)
bottom_pad = top_pad = int((new_height - image1.shape[0]) / 2)
image1_padded = cv2.copyMakeBorder(
image1, top_pad, bottom_pad, left_pad, right_pad, cv2.BORDER_CONSTANT, value=pad_value
)
return image1_padded
def estimate_img_mask(image):
# 转换为灰度图像
gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
# 使用大津法进行阈值分割
# _, thresh = cv2.threshold(gray, 0, 255, cv2.THRESH_BINARY_INV + cv2.THRESH_OTSU)
# mask_otsu = thresh.astype(bool)
# thresh_gray = 240
# 使用 Canny 边缘检测算法找到边缘
edges = cv2.Canny(gray, 20, 50)
# 使用形态学操作扩展边缘
kernel = np.ones((3, 3), np.uint8)
edges_dilated = cv2.dilate(edges, kernel, iterations=1)
contours, _ = cv2.findContours(edges_dilated, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
# 创建一个空的 mask
mask = np.zeros_like(gray, dtype=np.uint8)
# 根据轮廓信息填充 mask(使用 thickness=cv2.FILLED 参数)
cv2.drawContours(mask, contours, -1, 255, thickness=cv2.FILLED)
mask = mask.astype(bool)
return mask
def compute_img_diff(img1, img2, matches1, matches1_from_2, vis=False):
scale = 0.125
gray_trunc_thres = 25 / 255.0
# Match
if matches1.shape[0] > 0:
match_scale = np.max(np.ptp(matches1, axis=-1))
match_dists = np.sqrt(np.sum((matches1 - matches1_from_2) ** 2, axis=-1))
dist_threshold = match_scale * 0.01
match_num = np.sum(match_dists <= dist_threshold)
match_rate = np.mean(match_dists <= dist_threshold)
else:
match_num = 0
match_rate = 0
# IOU
img1_mask = estimate_img_mask(img1)
img2_mask = estimate_img_mask(img2)
img_intersection = (img1_mask == 1) & (img2_mask == 1)
img_union = (img1_mask == 1) | (img2_mask == 1)
intersection = np.sum(img_intersection == 1)
union = np.sum(img_union == 1)
mask_iou = intersection / union if union != 0 else 0
# Gray
height, width = img1.shape[:2]
img1_gray = cv2.cvtColor(img1, cv2.COLOR_BGR2GRAY)
img2_gray = cv2.cvtColor(img2, cv2.COLOR_BGR2GRAY)
img1_gray = cv2.GaussianBlur(img1_gray, (7, 7), 0)
img2_gray = cv2.GaussianBlur(img2_gray, (7, 7), 0)
# Gray Diff
img1_gray_small = cv2.resize(img1_gray, (int(width * scale), int(height * scale)),
interpolation=cv2.INTER_LINEAR) / 255.0
img2_gray_small = cv2.resize(img2_gray, (int(width * scale), int(height * scale)),
interpolation=cv2.INTER_LINEAR) / 255.0
img_gray_small_diff = np.abs(img1_gray_small - img2_gray_small)
gray_diff = img_gray_small_diff.sum() / (union * scale) if union != 0 else 1
img_gray_small_diff_trunc = img_gray_small_diff.copy()
img_gray_small_diff_trunc[img_gray_small_diff < gray_trunc_thres] = 0
gray_diff_trunc = img_gray_small_diff_trunc.sum() / (union * scale) if union != 0 else 1
# Edge
img1_edge = cv2.Canny(img1_gray, 100, 200)
img2_edge = cv2.Canny(img2_gray, 100, 200)
bw_edges1 = (img1_edge > 0).astype(bool)
bw_edges2 = (img2_edge > 0).astype(bool)
hausdorff_dist = hausdorff_distance(bw_edges1, bw_edges2)
if vis == True:
fig, axs = plt.subplots(1, 4, figsize=(15, 5))
axs[0].imshow(img1_gray, cmap='gray')
axs[0].set_title('Img1')
axs[1].imshow(img2_gray, cmap='gray')
axs[1].set_title('Img2')
axs[2].imshow(img1_mask)
axs[2].set_title('Mask1')
axs[3].imshow(img2_mask)
axs[3].set_title('Mask2')
plt.show()
plt.figure()
mask_cmp = np.zeros((height, width, 3))
mask_cmp[img_intersection, 1] = 1
mask_cmp[img_union, 0] = 1
plt.imshow(mask_cmp)
plt.show()
fig, axs = plt.subplots(1, 4, figsize=(15, 5))
axs[0].imshow(img1_gray_small, cmap='gray')
axs[0].set_title('Img1 Gray')
axs[1].imshow(img2_gray_small, cmap='gray')
axs[1].set_title('Img2 Gary')
axs[2].imshow(img_gray_small_diff, cmap='gray')
axs[2].set_title('diff')
axs[3].imshow(img_gray_small_diff_trunc, cmap='gray')
axs[3].set_title('diff_trunct')
plt.show()
fig, axs = plt.subplots(1, 2, figsize=(15, 5))
axs[0].imshow(img1_edge, cmap='gray')
axs[0].set_title('img1_edge')
axs[1].imshow(img2_edge, cmap='gray')
axs[1].set_title('img2_edge')
plt.show()
info = {}
info['match_num'] = match_num
info['match_rate'] = match_rate
info['mask_iou'] = mask_iou
info['gray_diff'] = gray_diff
info['gray_diff_trunc'] = gray_diff_trunc
info['hausdorff_dist'] = hausdorff_dist
return info
def predict_match_success_human(info):
match_num = info['match_num']
match_rate = info['match_rate']
mask_iou = info['mask_iou']
gray_diff = info['gray_diff']
gray_diff_trunc = info['gray_diff_trunc']
hausdorff_dist = info['hausdorff_dist']
if mask_iou > 0.95:
return True
if match_num < 20 or match_rate < 0.7:
return False
if mask_iou > 0.80 and gray_diff < 0.040 and gray_diff_trunc < 0.010:
return True
if mask_iou > 0.70 and gray_diff < 0.050 and gray_diff_trunc < 0.008:
return True
'''
if match_rate<0.70 or match_num<3000:
return False
if (mask_iou>0.85 and hausdorff_dist<20)or (gray_diff<0.015 and gray_diff_trunc<0.01) or match_rate>=0.90:
return True
'''
return False
def predict_match_success(info, model=None):
if model == None:
return predict_match_success_human(info)
else:
feat_name = ['match_num', 'match_rate', 'mask_iou', 'gray_diff', 'gray_diff_trunc', 'hausdorff_dist']
# 提取特征
features = [info[f] for f in feat_name]
# 预测
pred = model.predict([features])[0]
return pred >= 0.5