Spaces:

stabilityai
/

stable-fast-3d

Running on L4

Aaryaman Vasishta

Update to latest inference code

77d8010 10 months ago

2.7 kB

	import os
	from typing import Any, Union

	import numpy as np
	import rembg
	import torch
	import torchvision.transforms.functional as torchvision_F
	from PIL import Image

	import sf3d.models.utils as sf3d_utils


	def get_device():
	    """Pick the torch device string to run on.

	    Returns:
	        ``"cpu"`` when the ``SF3D_USE_CPU`` environment variable equals
	        ``"1"``; otherwise ``"cuda"`` if CUDA is available, else ``"mps"``
	        if the MPS backend is available, else ``"cpu"``.
	    """
	    # An explicit opt-out wins before any accelerator is probed.
	    cpu_forced = os.environ.get("SF3D_USE_CPU", "0") == "1"
	    if cpu_forced:
	        return "cpu"

	    if torch.cuda.is_available():
	        return "cuda"
	    if torch.backends.mps.is_available():
	        return "mps"
	    return "cpu"


	def create_intrinsic_from_fov_deg(fov_deg: float, cond_height: int, cond_width: int):
	    """Build an intrinsic matrix from a field of view given in degrees.

	    The field of view is converted to radians and handed to
	    ``sf3d_utils.get_intrinsic_from_fov`` together with the image size.

	    Args:
	        fov_deg: Field of view in degrees.
	        cond_height: Image height, passed as ``H`` and used to scale row 1.
	        cond_width: Image width, passed as ``W`` and used to scale row 0.

	    Returns:
	        A tuple ``(intrinsic, intrinsic_normed_cond)``: the matrix returned by
	        the helper, and a clone whose ``[0, 0]``/``[0, 2]`` entries are divided
	        by ``cond_width`` and whose ``[1, 1]``/``[1, 2]`` entries are divided
	        by ``cond_height``.
	    """
	    fov_rad = np.deg2rad(fov_deg)
	    intrinsic = sf3d_utils.get_intrinsic_from_fov(fov_rad, H=cond_height, W=cond_width)

	    # Work on a clone so the unnormalized matrix is returned untouched.
	    normalized = intrinsic.clone()
	    # Presumably row 0 holds fx/cx and row 1 holds fy/cy - confirm against
	    # sf3d_utils.get_intrinsic_from_fov.
	    for row, extent in ((0, cond_width), (1, cond_height)):
	        normalized[..., row, 2] /= extent
	        normalized[..., row, row] /= extent

	    return intrinsic, normalized


	def default_cond_c2w(distance: float):
	    """Return the default 4x4 conditioning matrix for a given distance.

	    Args:
	        distance: Value placed in the last column of the first row
	            (presumably the camera offset of a camera-to-world transform).

	    Returns:
	        A 4x4 ``torch.float32`` tensor.
	    """
	    rows = [
	        [0, 0, 1, distance],
	        [1, 0, 0, 0],
	        [0, 1, 0, 0],
	        [0, 0, 0, 1],
	    ]
	    matrix = torch.as_tensor(rows)
	    return matrix.float()


	def remove_background(
	    image: Image.Image,
	    rembg_session: Any = None,
	    force: bool = False,
	    **rembg_kwargs,
	) -> Image.Image:
	    """Strip the background from ``image`` with rembg unless it is already cut out.

	    An image counts as already cut out when its mode is ``"RGBA"`` and the
	    minimum of its alpha band is below 255, i.e. at least one pixel is not
	    fully opaque.

	    Args:
	        image: Input PIL image.
	        rembg_session: Passed to ``rembg.remove`` as ``session``.
	        force: Run background removal even if the image is already cut out.
	        **rembg_kwargs: Extra keyword arguments forwarded to ``rembg.remove``.

	    Returns:
	        The result of ``rembg.remove`` when removal runs, otherwise the input
	        image unchanged.
	    """
	    # getextrema() yields one (min, max) pair per band; index 3 is alpha.
	    already_cut_out = image.mode == "RGBA" and image.getextrema()[3][0] < 255
	    if force or not already_cut_out:
	        image = rembg.remove(image, session=rembg_session, **rembg_kwargs)
	    return image


	def get_1d_bounds(arr):
	    """Return the first and last flat indices of the non-zero entries of ``arr``.

	    Raises:
	        IndexError: If ``arr`` contains no non-zero entry.
	    """
	    nonzero_idx = np.nonzero(np.ravel(arr))[0]
	    first, last = nonzero_idx[0], nonzero_idx[-1]
	    return first, last


	def get_bbox_from_mask(mask, thr=0.5):
	    """Compute the bounding box of the mask entries greater than ``thr``.

	    Args:
	        mask: NumPy array; the last axis is reduced for the y bounds and the
	            second-to-last axis for the x bounds.
	        thr: Entries strictly greater than this value count as foreground.

	    Returns:
	        ``(x0, y0, x1, y1)``, where each value is the index of the first or
	        last column/row containing foreground (both ends inclusive).

	    Raises:
	        AssertionError: If no entry exceeds ``thr``.
	    """
	    foreground = (mask > thr).astype(np.float32)
	    assert foreground.sum() > 0, "Empty mask!"

	    # Collapsing rows leaves per-column counts (x extent); collapsing columns
	    # leaves per-row counts (y extent).
	    per_column = foreground.sum(axis=-2)
	    per_row = foreground.sum(axis=-1)
	    x0, x1 = get_1d_bounds(per_column)
	    y0, y1 = get_1d_bounds(per_row)
	    return x0, y0, x1, y1


	def resize_foreground(
	    image: Union[Image.Image, np.ndarray],
	    ratio: float,
	    out_size=None,
	) -> Image.Image:
	    """Crop a square around the foreground so it fills ``ratio`` of the crop.

	    The foreground is the bounding box of the alpha channel (last channel)
	    as computed by ``get_bbox_from_mask`` with ``thr=0.5``. The square crop
	    is centered on that box and has side ``max(box_h, box_w) / ratio``.

	    Args:
	        image: RGBA PIL image, or a NumPy array that is converted with
	            ``Image.fromarray(..., mode="RGBA")``.
	        ratio: Fraction of the crop side that the longer box side occupies.
	        out_size: If not ``None``, passed to ``Image.resize`` on the crop.

	    Returns:
	        The cropped (and optionally resized) image.

	    Raises:
	        AssertionError: If the image mode is not ``"RGBA"``, or if
	            ``get_bbox_from_mask`` finds an empty mask.
	    """
	    if isinstance(image, np.ndarray):
	        image = Image.fromarray(image, mode="RGBA")
	    assert image.mode == "RGBA"

	    # Bounding box of the alpha channel.
	    alpha = np.array(image)[:, :, -1]
	    x1, y1, x2, y2 = get_bbox_from_mask(alpha, thr=0.5)

	    # NOTE(review): the bounds are inclusive indices, so these extents are one
	    # pixel short of the true box size; kept as-is to preserve the output.
	    box_h = y2 - y1
	    box_w = x2 - x1
	    center_y = (y1 + y2) / 2
	    center_x = (x1 + x2) / 2
	    side = max(box_h, box_w) / ratio

	    cropped = torchvision_F.crop(
	        image,
	        top=int(center_y - side / 2),
	        left=int(center_x - side / 2),
	        height=int(side),
	        width=int(side),
	    )
	    if out_size is not None:
	        cropped = cropped.resize(out_size)

	    return cropped