Source code for openlifu.photoscan

from __future__ import annotations

import importlib
import json
import shutil
import subprocess
import tempfile
from dataclasses import dataclass
from pathlib import Path
from typing import Annotated, Dict, Tuple

import numpy as np
import OpenEXR
import trimesh
import vtk
from PIL import Image
from vtk.util.numpy_support import numpy_to_vtk

from openlifu.util.annotations import OpenLIFUFieldData


[docs] @dataclass class Photoscan: id: Annotated[str, OpenLIFUFieldData("Photoscan ID", "ID of this photoscan")] = "photoscan" """ID of this photoscan""" name: Annotated[str, OpenLIFUFieldData("Photoscan name", "Photoscan name")] = "Photoscan" """Photoscan name""" model_filename: Annotated[str | None, OpenLIFUFieldData("Model filename", "Relative path to model")] = None """Relative path to model""" texture_filename: Annotated[str | None, OpenLIFUFieldData("Texture filename", "Relative path to texture image")] = None """Relative path to texture image""" mtl_filename: Annotated[str | None, OpenLIFUFieldData("Material filename", "Relative path to materials file")] = None """Relative path to materials file""" photoscan_approved: Annotated[bool, OpenLIFUFieldData("Approved?", "Approval state of the photoscan. 'True' means the user has provided some kind of confirmation that the photoscan is good enough to be used.")] = False """Approval state of the photoscan. 'True' means the user has provided some kind of confirmation that the photoscan is good enough to be used."""
[docs] @staticmethod def from_json(json_string: str) -> Photoscan: """Load a Photoscan from a json string""" return Photoscan.from_dict(json.loads(json_string))
[docs] def to_json(self, compact: bool) -> str: """Serialize a Photoscan to a json string. This is different to the format written to file and does not contain the loaded models and texture. Args: compact:if enabled then the string is compact (not pretty). Disable for pretty. Returns: A json string representing the complete Photoscan object """ from openlifu.util.json import PYFUSEncoder if compact: return json.dumps(self.to_dict(), separators=(',', ':'), cls=PYFUSEncoder) else: return json.dumps(self.to_dict(), indent=4, cls=PYFUSEncoder)
[docs] @staticmethod def from_dict(d:Dict) -> Photoscan: """ Create a Photoscan from a dictionary param d: Dictionary of photoscan parameters. returns: Photoscan object """ return Photoscan(**d)
[docs] def to_dict(self) -> Dict: """ Convert the photoscan to a dictionary returns: Dictionary of photoscan parameters """ d = self.__dict__.copy() return d
[docs] @staticmethod def from_file(filename) -> Photoscan: """ Load a Photoscan from a metadata file :param filename: Name of the file """ with open(filename) as f: return Photoscan.from_dict(json.load(f))
[docs] def to_file(self, filename): """ Save the photoscan to a file. :param filename: Name of the file """ Path(filename).parent.parent.mkdir(exist_ok=True) #photoscan directory Path(filename).parent.mkdir(exist_ok=True) with open(filename, 'w') as file: file.write(self.to_json(compact = False))
[docs] def load_data_from_filepaths(model_abspath: str, texture_abspath: str) -> Tuple[vtk.vtkPolyData, vtk.vtkImageData]: """ This function returns the data directly from the model and texture filepaths without requiring a photoscan object. param model_abspath: absolute filepath to model data texture abspath: absolute filepath to texture data Returns: Photoscan data as (model_vtkpolydata, texture_vtkimagedata) """ model_polydata = load_model(model_abspath) texture_imagedata = load_texture(texture_abspath) return (model_polydata, texture_imagedata)
[docs] def load_data_from_photoscan(photoscan: Photoscan, parent_dir) -> Tuple[vtk.vtkPolyData, vtk.vtkImageData]: """ param parent_dir: parent directory containing model and texture data filepaths Returns: Photoscan data as (model_vtkpolydata, texture_vtkimagedata) """ model_polydata = load_model(Path(parent_dir)/photoscan.model_filename) texture_imagedata = load_texture(Path(parent_dir)/photoscan.texture_filename) return (model_polydata, texture_imagedata)
[docs] def load_model(file_name) -> vtk.vtkPolyData: """ This function assumes that the model is saved to file in LPS coordinates. The model that is returned is in RAS coordinates """ if not Path(file_name).exists(): raise FileNotFoundError(f'Model filepath does not exist: {file_name}') mesh = read_as_vtkpolydata(file_name) mesh_ras = convert_between_ras_and_lps(mesh) return mesh_ras
[docs] def load_texture(file_name) -> vtk.vtkImageData: if not Path(file_name).exists(): raise FileNotFoundError(f'Texture data filepath does not exist: {file_name}') texture = read_as_vtkimagedata(file_name) return texture
[docs] def read_as_vtkpolydata(file_name): suffix_to_reader_dict = { '.ply' : vtk.vtkPLYReader, '.vtp' : vtk.vtkXMLPolyDataReader, '.obj' : vtk.vtkOBJReader, '.stl' : vtk.vtkSTLReader, '.vtk' : vtk.vtkPolyDataReader, '.g' : vtk.vtkBYUReader } path = Path(file_name) ext = path.suffix.lower() if path.suffix not in suffix_to_reader_dict: raise ValueError(f"File format {ext} not supported by reader") reader = suffix_to_reader_dict[ext]() if ext == '.g': reader.SetGeometryName(file_name) else: reader.SetFileName(file_name) reader.Update() poly_data = reader.GetOutput() return poly_data
[docs] def convert_numpy_to_vtkimage(image_numpy: np.ndarray) -> vtk.vtkImageData: """ Converts a numpy array with dimensions [HxWx3] representing an RGB image into vtkImageData """ vtkimage_data = vtk.vtkImageData() vtkimage_data.SetDimensions(image_numpy.shape[1], image_numpy.shape[0], 1) vtkimage_data.SetNumberOfScalarComponents(image_numpy.shape[2], vtkimage_data.GetInformation()) pd = vtkimage_data.GetPointData() new_rgb_data = image_numpy.reshape((-1, image_numpy.shape[2])) vtk_array = numpy_to_vtk(new_rgb_data, deep=True, array_type=vtk.VTK_UNSIGNED_SHORT) pd.SetScalars(vtk_array) return vtkimage_data
[docs] def read_as_vtkimagedata(file_name) -> vtk.vtkImageData: suffix_to_reader_dict = { '.jpg' : vtk.vtkJPEGReader, '.png' : vtk.vtkPNGReader, '.tiff' : vtk.vtkTIFFReader, } path = Path(file_name) ext = path.suffix.lower() if ext == '.exr': with OpenEXR.File(str(file_name), separate_channels = True) as exr_file: R = exr_file.channels()['R'].pixels G = exr_file.channels()['G'].pixels B = exr_file.channels()['B'].pixels # Combine channels into a single RGB image (H x W x 3) rgb_data = np.stack([R, G, B], axis=-1, dtype = np.float32) # EXR stores pixel data using half 16-bit floating point values. Convert data to an 8-bit image compatibility with VTK rgb_data = np.clip(rgb_data*(2**16-1), 0, 65535) image_data = convert_numpy_to_vtkimage(rgb_data) elif ext in suffix_to_reader_dict: reader = suffix_to_reader_dict[ext]() reader.SetFileName(file_name) reader.Update() image_data = reader.GetOutput() else: raise ValueError(f"File format {path.suffix} not supported by reader") return image_data
[docs] def convert_between_ras_and_lps(mesh : vtk.vtkPointSet) -> vtk.vtkPointSet: """Converts a mesh (polydata, unstructured grid or even just a point cloud) between the LPS (left-posterior-superior) coordinate system and RAS (right-anterior-superior) coordinate system.""" transform_ras_to_lps = vtk.vtkTransform() transform_ras_to_lps.Scale(-1,-1,1) transformFilter = vtk.vtkTransformPolyDataFilter() transformFilter.SetInputData(mesh) transformFilter.SetTransform(transform_ras_to_lps) transformFilter.Update() return transformFilter.GetOutput()
[docs] def run_reconstruction(images: list[Path], pipeline: Path | None = None) -> Tuple[Photoscan,Path]: """Run Meshroom with the given images and pipeline. Args: images (list[Path]): List of image file paths. pipeline (Path): Path to the Meshroom pipeline file. Returns: photoscan: The Photoscan of the reconstructed images. data_dir (Path): The directory containing the underlying data files whose names are given in the Photoscan. """ if pipeline is None: pipeline = importlib.resources.files("openlifu.meshroom_pipelines") / "default_pipeline.mg" if shutil.which("meshroom_batch") is None: raise FileNotFoundError("Error: 'meshroom_batch' is not found in system PATH. Ensure it is installed and accessible.") if not Path.exists(pipeline): raise FileNotFoundError(f"Error: The pipeline file '{pipeline}' does not exist.") temp_dir = Path(tempfile.mkdtemp()) images_dir = temp_dir / "images" images_dir.mkdir(parents=True, exist_ok=True) for image in images: shutil.copy(image, images_dir / image.name) output_dir = temp_dir / "output" cache_dir = temp_dir / "cache" command = [ "meshroom_batch", "--pipeline", str(pipeline), "--output", str(output_dir), "--input", str(images_dir), "--cache", str(cache_dir) ] subprocess.run(command, check=True) output_dir_merged = temp_dir / "output_dir_merged" output_dir_merged.mkdir(parents=True, exist_ok=True) merge_textures(output_dir / "texturedMesh.obj", output_dir_merged) photoscan_dict = { "model_filename": "texturedMesh.obj", "texture_filename": "material_0.png", "mtl_filename": "material.mtl", } photoscan = Photoscan.from_dict(photoscan_dict) return photoscan, output_dir_merged
[docs] def udim_to_tile(udim_str: str) -> Tuple[int, int]: x = int(udim_str[-2:]) - 1 tile_u = x % 10 tile_v = x // 10 return tile_u, tile_v
[docs] def merge_textures(input_obj_path: Path, output_path: Path) -> None: scene = trimesh.load(input_obj_path, process=True) if isinstance(scene, trimesh.Scene): mesh_dict = scene.geometry else: mesh_dict = {'material_1001': scene} for name, mesh in mesh_dict.items(): mesh.tile = udim_to_tile(name[-4:]) num_u_tiles = max(mesh.tile[0] for _, mesh in mesh_dict.items()) + 1 num_v_tiles = max(mesh.tile[1] for _, mesh in mesh_dict.items()) + 1 first_tile = np.array(mesh_dict['material_1001'].visual.material.image) tile_height, tile_width, tile_ch = first_tile.shape tex_height, tex_width = num_v_tiles*tile_height, num_u_tiles*tile_height new_texture = np.zeros((tex_height, tex_width, tile_ch), dtype=first_tile.dtype) new_verts = [] new_faces = [] new_uvs = [] num_verts = 0 for _, mesh in mesh_dict.items(): tile_u, tile_v = mesh.tile texture_tile = np.array(mesh.visual.material.image) new_texture[tex_height - tile_height*(tile_v+1): tex_height-tile_height*tile_v, tile_width*tile_u:tile_width*(tile_u+1)] = texture_tile new_verts.append(mesh.vertices) new_faces.append(mesh.faces+num_verts) new_uvs.append(mesh.visual.uv) num_verts += mesh.vertices.shape[0] new_texture = Image.fromarray(new_texture) new_verts = np.concatenate(new_verts, axis=0) new_faces = np.concatenate(new_faces, axis=0) new_uvs = np.concatenate(new_uvs, axis=0) new_uvs = new_uvs/np.array([num_u_tiles, num_v_tiles]).reshape(-1,2) mesh = trimesh.Trimesh() #Note putting vertices in this constructor will merge nearby ones mesh.vertices = new_verts mesh.faces = new_faces mesh.visual = trimesh.visual.TextureVisuals(uv=new_uvs, image=new_texture) mesh.export(output_path / "texturedMesh.obj")