|
from typing import Any |
|
|
|
import numpy as np |
|
import rembg |
|
import torch |
|
from PIL import Image |
|
|
|
import sf3d.models.utils as sf3d_utils |
|
|
|
|
|
def create_intrinsic_from_fov_deg(fov_deg: float, cond_height: int, cond_width: int): |
|
intrinsic = sf3d_utils.get_intrinsic_from_fov( |
|
np.deg2rad(fov_deg), |
|
H=cond_height, |
|
W=cond_width, |
|
) |
|
intrinsic_normed_cond = intrinsic.clone() |
|
intrinsic_normed_cond[..., 0, 2] /= cond_width |
|
intrinsic_normed_cond[..., 1, 2] /= cond_height |
|
intrinsic_normed_cond[..., 0, 0] /= cond_width |
|
intrinsic_normed_cond[..., 1, 1] /= cond_height |
|
|
|
return intrinsic, intrinsic_normed_cond |
|
|
|
|
|
def default_cond_c2w(distance: float): |
|
c2w_cond = torch.as_tensor( |
|
[ |
|
[0, 0, 1, distance], |
|
[1, 0, 0, 0], |
|
[0, 1, 0, 0], |
|
[0, 0, 0, 1], |
|
] |
|
).float() |
|
return c2w_cond |
|
|
|
|
|
def remove_background( |
|
image: Image, |
|
rembg_session: Any = None, |
|
force: bool = False, |
|
**rembg_kwargs, |
|
) -> Image: |
|
do_remove = True |
|
if image.mode == "RGBA" and image.getextrema()[3][0] < 255: |
|
do_remove = False |
|
do_remove = do_remove or force |
|
if do_remove: |
|
image = rembg.remove(image, session=rembg_session, **rembg_kwargs) |
|
return image |
|
|
|
|
|
def resize_foreground( |
|
image: Image, |
|
ratio: float, |
|
) -> Image: |
|
image = np.array(image) |
|
assert image.shape[-1] == 4 |
|
alpha = np.where(image[..., 3] > 0) |
|
y1, y2, x1, x2 = ( |
|
alpha[0].min(), |
|
alpha[0].max(), |
|
alpha[1].min(), |
|
alpha[1].max(), |
|
) |
|
|
|
fg = image[y1:y2, x1:x2] |
|
|
|
size = max(fg.shape[0], fg.shape[1]) |
|
ph0, pw0 = (size - fg.shape[0]) // 2, (size - fg.shape[1]) // 2 |
|
ph1, pw1 = size - fg.shape[0] - ph0, size - fg.shape[1] - pw0 |
|
new_image = np.pad( |
|
fg, |
|
((ph0, ph1), (pw0, pw1), (0, 0)), |
|
mode="constant", |
|
constant_values=((0, 0), (0, 0), (0, 0)), |
|
) |
|
|
|
|
|
new_size = int(new_image.shape[0] / ratio) |
|
|
|
ph0, pw0 = (new_size - size) // 2, (new_size - size) // 2 |
|
ph1, pw1 = new_size - size - ph0, new_size - size - pw0 |
|
new_image = np.pad( |
|
new_image, |
|
((ph0, ph1), (pw0, pw1), (0, 0)), |
|
mode="constant", |
|
constant_values=((0, 0), (0, 0), (0, 0)), |
|
) |
|
new_image = Image.fromarray(new_image, mode="RGBA") |
|
return new_image |
|
|