Spaces:

Nike4D
/

3dmodelmaker

Running

3dmodelmaker / src /extracted_objects_model.py

ikeda

translate Japanese comments to English

6810bed over 1 year ago

10.4 kB

	import io
	import numpy as np
	from PIL import Image as PIL_Image # Renaming to avoid conflict with Image from gltflib
	import cv2
	import struct
	import triangle
	import uuid

	from gltflib import (
	GLTF, GLTFModel, Asset, Scene, Node, Mesh, Primitive, Attributes, Buffer, BufferView, Image, Texture, TextureInfo, Material, Sampler, Accessor, AccessorType,
	BufferTarget, ComponentType, GLBResource, PBRMetallicRoughness)

	# Create vertex lists for both the front and back surfaces
	def make_front_and_back_vertex_list(coordinate_list, img, half_thickness=0.2):
	    """Turn pixel-space contours into paired front/back 3D vertex rings.

	    Each (x, y) pixel coordinate is rescaled so that 0 maps to -1 and the
	    image width/height maps to +1. The Y axis is negated because image rows
	    grow downwards while the GLB Y axis points up.

	    Args:
	        coordinate_list: Iterable of contours; each contour is an iterable of
	            (x, y) pixel coordinates.
	        img: Object exposing ``size`` as ``(width, height)``, as PIL images do.
	        half_thickness: Distance of the front (+Z) and back (-Z) rings from
	            the Z = 0 plane. Defaults to the previously hard-coded 0.2.

	    Returns:
	        Tuple ``(front_vertex_list, back_vertex_list)``. Both are lists with
	        one entry per contour, each entry being a list of ``(x, y, z)`` tuples
	        in the same order as the input points.
	    """
	    width, height = img.size[0], img.size[1]

	    front_vertex_list = []
	    back_vertex_list = []
	    for coordinates in coordinate_list:
	        front_vertices = []
	        back_vertices = []
	        for coordinate in coordinates:
	            # Normalise once and reuse for both rings; only Z differs.
	            x = coordinate[0] * 2 / width - 1.0
	            y = -(coordinate[1] * 2 / height - 1.0)
	            front_vertices.append((x, y, half_thickness))
	            back_vertices.append((x, y, -half_thickness))

	        front_vertex_list.append(front_vertices)
	        back_vertex_list.append(back_vertices)

	    return front_vertex_list, back_vertex_list

	# Creation of various information for the mesh
	def make_mesh_data(coordinate_list, img):
	    """Build the vertex attributes and triangle indices of the extruded mesh.

	    Every contour becomes a slab: a front cap at +Z, a back cap at -Z and a
	    band of side triangles joining the two rings.

	    Args:
	        coordinate_list: Iterable of contours, each an iterable of (x, y)
	            pixel coordinates.
	        img: Image object exposing ``size`` as ``(width, height)``.

	    Returns:
	        Tuple ``(vertices, normals, texcoord_0s, vertex_indices)``:
	        ``vertices`` is a list of (x, y, z) tuples laid out per contour as the
	        front ring followed by the back ring; ``normals`` holds (0, 0, 1) for
	        front vertices and (0, 0, -1) for back vertices; ``texcoord_0s`` is a
	        list of (u, v) tuples, one per vertex; ``vertex_indices`` is a flat
	        list of ints, three per triangle.
	    """
	    front_vertex_list, back_vertex_list = make_front_and_back_vertex_list(coordinate_list, img)

	    vertices = []        # POSITION
	    normals = []         # NORMAL
	    vertex_indices = []
	    for front_vertices, back_vertices in zip(front_vertex_list, back_vertex_list):
	        count = len(front_vertices)
	        # Offsets of this contour's rings inside the shared vertex list.
	        front_offset = len(vertices)
	        back_offset = front_offset + count

	        vertices.extend(front_vertices)
	        vertices.extend(back_vertices)
	        normals.extend([(0.0, 0.0, 1.0)] * count)
	        normals.extend([(0.0, 0.0, -1.0)] * len(back_vertices))

	        # A polygon needs at least three points; a degenerate contour keeps
	        # its (unreferenced) vertices but contributes no triangles.
	        if count < 3:
	            continue

	        ring = np.arange(count)
	        following = np.roll(ring, -1)  # index of the next point, wrapping around

	        polygon = {
	            'vertices': np.array(front_vertices)[:, :2],
	            # Closed outline: every point is joined to its successor.
	            'segments': np.column_stack((ring, following)),
	        }
	        triangles = np.asarray(triangle.triangulate(polygon, 'p')['triangles'])

	        # Front cap: Triangle emits counter-clockwise triangles, which face +Z.
	        vertex_indices.extend((triangles + front_offset).ravel().tolist())
	        # Back cap: reverse the winding so the faces point towards -Z and
	        # agree with the (0, 0, -1) normals assigned above.
	        vertex_indices.extend((triangles[:, ::-1] + back_offset).ravel().tolist())

	        # Side band, two triangles per outline edge.
	        # NOTE(review): the two triangles of each quad have opposite winding
	        # and reuse the cap normals; left unchanged here, and the mesh is
	        # rendered with a double-sided material by the caller in this file.
	        side_1 = np.column_stack((front_offset + ring,
	                                  front_offset + following,
	                                  back_offset + ring))
	        side_2 = np.column_stack((back_offset + ring,
	                                  back_offset + following,
	                                  front_offset + following))
	        vertex_indices.extend(side_1.ravel().tolist())
	        vertex_indices.extend(side_2.ravel().tolist())

	    # Texture coordinates (TEXCOORD_0).
	    # The image origin is at the top-left, so the Y axis is inverted again.
	    texcoord_0s = [((vertex[0] + 1.0) / 2.0, 1.0 - ((vertex[1] + 1.0) / 2.0)) for vertex in vertices]

	    return vertices, normals, texcoord_0s, vertex_indices

	def _find_object_outlines(img):
	    """Trace the outer outline of every region that differs from the background.

	    The colour of the top-left pixel is treated as the background colour.

	    Args:
	        img: RGB PIL image.

	    Returns:
	        List of contours, each a list of ``(x, y)`` integer pixel coordinates.
	    """
	    pixels = np.array(img)
	    background = pixels[0, 0]
	    # Single-channel mask: 255 wherever any channel differs from the background.
	    mask = np.any(pixels != background, axis=-1).astype(np.uint8) * 255
	    # Morphological opening with a 15x15 kernel before tracing the outlines.
	    opened = cv2.morphologyEx(mask, cv2.MORPH_OPEN, kernel=np.ones((15, 15), np.uint8))
	    contours, _ = cv2.findContours(opened, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_NONE)
	    return [[(int(x), int(y)) for [[x, y]] in contour] for contour in contours]


	def create_extracted_objects_model(img_bytearray):
	    """Create a GLB model of the objects cut out of an image and save it.

	    Regions that differ from the top-left pixel's colour are outlined,
	    extruded into slabs textured with the image, and exported as a GLB file.

	    Args:
	        img_bytearray: Image source handed directly to ``PIL.Image.open``.

	    Returns:
	        Path of the written file, ``'../tmp/<random hex>.glb'``.

	    Raises:
	        ValueError: If no object could be separated from the background, so
	            there is no geometry to export.
	    """
	    # Retrieve the image and re-encode it as the JPEG embedded in the GLB.
	    img = PIL_Image.open(img_bytearray).convert('RGB')
	    jpeg_buffer = io.BytesIO()
	    img.save(jpeg_buffer, format="JPEG", quality=95)
	    image_bytes = jpeg_buffer.getvalue()

	    # Scale of the 3D model: keeps the image aspect ratio, unit area in X/Y.
	    width, height = img.size
	    scale_factor = (width * height) ** 0.5
	    scale = (width / scale_factor, height / scale_factor, 0.4)

	    # Outlines of the main parts of the image, then the mesh built from them.
	    coordinate_list = _find_object_outlines(img)
	    vertices, normals, texcoord_0s, vertex_indices = make_mesh_data(coordinate_list, img)
	    if not vertices or not vertex_indices:
	        raise ValueError('no object could be separated from the background colour')

	    # glTF buffers are little-endian, so the byte order is spelled out
	    # instead of relying on the host's native order.
	    positions = np.asarray(vertices, dtype='<f4')
	    # Bounds are taken from the stored float32 values so they match the buffer.
	    mins = positions.min(axis=0).tolist()
	    maxs = positions.max(axis=0).tolist()

	    # 16-bit indices only address 65535 vertices (65535 itself is reserved);
	    # larger meshes switch to 32-bit indices instead of failing to pack.
	    if len(vertices) <= 65535:
	        index_dtype = '<u2'
	        index_component = ComponentType.UNSIGNED_SHORT.value
	    else:
	        index_dtype = '<u4'
	        index_component = ComponentType.UNSIGNED_INT.value

	    # Binary sections in buffer order, each with its bufferView target.
	    sections = [
	        (positions.tobytes(), BufferTarget.ARRAY_BUFFER.value),                           # POSITION
	        (np.asarray(normals, dtype='<f4').tobytes(), BufferTarget.ARRAY_BUFFER.value),     # NORMAL
	        (np.asarray(texcoord_0s, dtype='<f4').tobytes(), BufferTarget.ARRAY_BUFFER.value), # TEXCOORD_0
	        (np.asarray(vertex_indices, dtype=index_dtype).tobytes(),
	         BufferTarget.ELEMENT_ARRAY_BUFFER.value),                                         # indices
	        (image_bytes, None),                                                               # JPEG image
	    ]

	    # Concatenate the sections; each view starts where the previous one ended.
	    all_bytearray = bytearray()
	    bufferViews = []
	    for data, target in sections:
	        bufferViews.append(
	            BufferView(buffer=0, byteOffset=len(all_bytearray), byteLength=len(data), target=target)
	        )
	        all_bytearray.extend(data)

	    # GLBResource
	    resources = [GLBResource(data=all_bytearray)]

	    # Asset
	    asset = Asset()

	    # Buffer
	    buffers = [Buffer(byteLength=len(all_bytearray))]

	    # Accessor
	    accessors = [
	        Accessor(bufferView=0, componentType=ComponentType.FLOAT.value, count=len(vertices),
	                 type=AccessorType.VEC3.value, max=maxs, min=mins),
	        Accessor(bufferView=1, componentType=ComponentType.FLOAT.value, count=len(normals),
	                 type=AccessorType.VEC3.value, max=None, min=None),
	        Accessor(bufferView=2, componentType=ComponentType.FLOAT.value, count=len(texcoord_0s),
	                 type=AccessorType.VEC2.value, max=None, min=None),
	        Accessor(bufferView=3, componentType=index_component, count=len(vertex_indices),
	                 type=AccessorType.SCALAR.value, max=None, min=None),
	    ]

	    # Image
	    images = [
	        Image(mimeType='image/jpeg', bufferView=4),
	    ]

	    # Sampler
	    # magFilter: nearest-neighbour filtering; minFilter: mipmap + nearest-neighbour filtering
	    samplers = [Sampler(magFilter=9728, minFilter=9984)]

	    # Texture
	    textures = [
	        Texture(name='Main', sampler=0, source=0),
	    ]

	    # Material
	    materials = [
	        Material(
	            pbrMetallicRoughness=PBRMetallicRoughness(
	                baseColorTexture=TextureInfo(index=0),
	                metallicFactor=0,
	                roughnessFactor=1
	            ),
	            name='Material0',
	            alphaMode='OPAQUE',
	            doubleSided=True
	        ),
	    ]

	    # Mesh (mode 4 = TRIANGLES)
	    meshes = [
	        Mesh(name='Main', primitives=[Primitive(attributes=Attributes(POSITION=0, NORMAL=1, TEXCOORD_0=2),
	                                                indices=3, material=0, mode=4)]),
	    ]

	    # Node
	    nodes = [
	        Node(mesh=0, rotation=None, scale=scale),
	    ]

	    # Scene
	    scene = 0
	    scenes = [Scene(name='Scene', nodes=[0])]

	    # GLTFModel
	    model = GLTFModel(
	        asset=asset,
	        buffers=buffers,
	        bufferViews=bufferViews,
	        accessors=accessors,
	        images=images,
	        samplers=samplers,
	        textures=textures,
	        materials=materials,
	        meshes=meshes,
	        nodes=nodes,
	        scene=scene,
	        scenes=scenes
	    )

	    gltf = GLTF(model=model, resources=resources)

	    # Random file name so concurrent calls do not overwrite each other's output.
	    tmp_filename = uuid.uuid4().hex
	    model_path = f'../tmp/{tmp_filename}.glb'

	    gltf.export(model_path)

	    return model_path