kushbhargav
/

image_to_3d

Model card Files Files and versions Community

image_to_3d / trellis /renderers /gaussian_render.py

kushbhargav

Upload 194 files

62a650e verified about 1 month ago

raw

history blame contribute delete

8.35 kB

	#
	# Copyright (C) 2023, Inria
	# GRAPHDECO research group, https://team.inria.fr/graphdeco
	# All rights reserved.
	#
	# This software is free for non-commercial, research and evaluation use
	# under the terms of the LICENSE.md file.
	#
	# For inquiries contact [email protected]
	#

	import torch
	import math
	from easydict import EasyDict as edict
	import numpy as np
	from ..representations.gaussian import Gaussian
	from .sh_utils import eval_sh
	import torch.nn.functional as F
	from easydict import EasyDict as edict


	def intrinsics_to_projection(
	intrinsics: torch.Tensor,
	near: float,
	far: float,
	) -> torch.Tensor:
	"""
	OpenCV intrinsics to OpenGL perspective matrix

	Args:
	intrinsics (torch.Tensor): [3, 3] OpenCV intrinsics matrix
	near (float): near plane to clip
	far (float): far plane to clip
	Returns:
	(torch.Tensor): [4, 4] OpenGL perspective matrix
	"""
	fx, fy = intrinsics[0, 0], intrinsics[1, 1]
	cx, cy = intrinsics[0, 2], intrinsics[1, 2]
	ret = torch.zeros((4, 4), dtype=intrinsics.dtype, device=intrinsics.device)
	ret[0, 0] = 2 * fx
	ret[1, 1] = 2 * fy
	ret[0, 2] = 2 * cx - 1
	ret[1, 2] = - 2 * cy + 1
	ret[2, 2] = far / (far - near)
	ret[2, 3] = near * far / (near - far)
	ret[3, 2] = 1.
	return ret


	def render(viewpoint_camera, pc : Gaussian, pipe, bg_color : torch.Tensor, scaling_modifier = 1.0, override_color = None):
	"""
	Render the scene.

	Background tensor (bg_color) must be on GPU!
	"""
	# lazy import
	if 'GaussianRasterizer' not in globals():
	from diff_gaussian_rasterization import GaussianRasterizer, GaussianRasterizationSettings

	# Create zero tensor. We will use it to make pytorch return gradients of the 2D (screen-space) means
	screenspace_points = torch.zeros_like(pc.get_xyz, dtype=pc.get_xyz.dtype, requires_grad=True, device="cuda") + 0
	try:
	screenspace_points.retain_grad()
	except:
	pass
	# Set up rasterization configuration
	tanfovx = math.tan(viewpoint_camera.FoVx * 0.5)
	tanfovy = math.tan(viewpoint_camera.FoVy * 0.5)

	kernel_size = pipe.kernel_size
	subpixel_offset = torch.zeros((int(viewpoint_camera.image_height), int(viewpoint_camera.image_width), 2), dtype=torch.float32, device="cuda")

	raster_settings = GaussianRasterizationSettings(
	image_height=int(viewpoint_camera.image_height),
	image_width=int(viewpoint_camera.image_width),
	tanfovx=tanfovx,
	tanfovy=tanfovy,
	kernel_size=kernel_size,
	subpixel_offset=subpixel_offset,
	bg=bg_color,
	scale_modifier=scaling_modifier,
	viewmatrix=viewpoint_camera.world_view_transform,
	projmatrix=viewpoint_camera.full_proj_transform,
	sh_degree=pc.active_sh_degree,
	campos=viewpoint_camera.camera_center,
	prefiltered=False,
	debug=pipe.debug
	)

	rasterizer = GaussianRasterizer(raster_settings=raster_settings)

	means3D = pc.get_xyz
	means2D = screenspace_points
	opacity = pc.get_opacity

	# If precomputed 3d covariance is provided, use it. If not, then it will be computed from
	# scaling / rotation by the rasterizer.
	scales = None
	rotations = None
	cov3D_precomp = None
	if pipe.compute_cov3D_python:
	cov3D_precomp = pc.get_covariance(scaling_modifier)
	else:
	scales = pc.get_scaling
	rotations = pc.get_rotation

	# If precomputed colors are provided, use them. Otherwise, if it is desired to precompute colors
	# from SHs in Python, do it. If not, then SH -> RGB conversion will be done by rasterizer.
	shs = None
	colors_precomp = None
	if override_color is None:
	if pipe.convert_SHs_python:
	shs_view = pc.get_features.transpose(1, 2).view(-1, 3, (pc.max_sh_degree+1)**2)
	dir_pp = (pc.get_xyz - viewpoint_camera.camera_center.repeat(pc.get_features.shape[0], 1))
	dir_pp_normalized = dir_pp/dir_pp.norm(dim=1, keepdim=True)
	sh2rgb = eval_sh(pc.active_sh_degree, shs_view, dir_pp_normalized)
	colors_precomp = torch.clamp_min(sh2rgb + 0.5, 0.0)
	else:
	shs = pc.get_features
	else:
	colors_precomp = override_color

	# Rasterize visible Gaussians to image, obtain their radii (on screen).
	rendered_image, radii = rasterizer(
	means3D = means3D,
	means2D = means2D,
	shs = shs,
	colors_precomp = colors_precomp,
	opacities = opacity,
	scales = scales,
	rotations = rotations,
	cov3D_precomp = cov3D_precomp
	)

	# Those Gaussians that were frustum culled or had a radius of 0 were not visible.
	# They will be excluded from value updates used in the splitting criteria.
	return edict({"render": rendered_image,
	"viewspace_points": screenspace_points,
	"visibility_filter" : radii > 0,
	"radii": radii})


	class GaussianRenderer:
	"""
	Renderer for the Voxel representation.

	Args:
	rendering_options (dict): Rendering options.
	"""

	def __init__(self, rendering_options={}) -> None:
	self.pipe = edict({
	"kernel_size": 0.1,
	"convert_SHs_python": False,
	"compute_cov3D_python": False,
	"scale_modifier": 1.0,
	"debug": False
	})
	self.rendering_options = edict({
	"resolution": None,
	"near": None,
	"far": None,
	"ssaa": 1,
	"bg_color": 'random',
	})
	self.rendering_options.update(rendering_options)
	self.bg_color = None

	def render(
	self,
	gausssian: Gaussian,
	extrinsics: torch.Tensor,
	intrinsics: torch.Tensor,
	colors_overwrite: torch.Tensor = None
	) -> edict:
	"""
	Render the gausssian.

	Args:
	gaussian : gaussianmodule
	extrinsics (torch.Tensor): (4, 4) camera extrinsics
	intrinsics (torch.Tensor): (3, 3) camera intrinsics
	colors_overwrite (torch.Tensor): (N, 3) override color

	Returns:
	edict containing:
	color (torch.Tensor): (3, H, W) rendered color image
	"""
	resolution = self.rendering_options["resolution"]
	near = self.rendering_options["near"]
	far = self.rendering_options["far"]
	ssaa = self.rendering_options["ssaa"]

	if self.rendering_options["bg_color"] == 'random':
	self.bg_color = torch.zeros(3, dtype=torch.float32, device="cuda")
	if np.random.rand() < 0.5:
	self.bg_color += 1
	else:
	self.bg_color = torch.tensor(self.rendering_options["bg_color"], dtype=torch.float32, device="cuda")

	view = extrinsics
	perspective = intrinsics_to_projection(intrinsics, near, far)
	camera = torch.inverse(view)[:3, 3]
	focalx = intrinsics[0, 0]
	focaly = intrinsics[1, 1]
	fovx = 2 * torch.atan(0.5 / focalx)
	fovy = 2 * torch.atan(0.5 / focaly)

	camera_dict = edict({
	"image_height": resolution * ssaa,
	"image_width": resolution * ssaa,
	"FoVx": fovx,
	"FoVy": fovy,
	"znear": near,
	"zfar": far,
	"world_view_transform": view.T.contiguous(),
	"projection_matrix": perspective.T.contiguous(),
	"full_proj_transform": (perspective @ view).T.contiguous(),
	"camera_center": camera
	})

	# Render
	render_ret = render(camera_dict, gausssian, self.pipe, self.bg_color, override_color=colors_overwrite, scaling_modifier=self.pipe.scale_modifier)

	if ssaa > 1:
	render_ret.render = F.interpolate(render_ret.render[None], size=(resolution, resolution), mode='bilinear', align_corners=False, antialias=True).squeeze()

	ret = edict({
	'color': render_ret['render']
	})
	return ret