STCFormer_hp/common/camera.py


								import sys

								import numpy as np

								import torch


								def normalize_screen_coordinates(X, w, h):

								    assert X.shape[-1] == 2

								    return X / w * 2 - [1, h / w]


								def image_coordinates(X, w, h):

								    assert X.shape[-1] == 2


								    # Reverse camera frame normalization

								    return (X + [1, h / w]) * w / 2


								def world_to_camera(X, R, t):

								    Rt = wrap(qinverse, R)

								    return wrap(qrot, np.tile(Rt, (*X.shape[:-1], 1)), X - t)


								def camera_to_world(X, R, t):

								    return wrap(qrot, np.tile(R, (*X.shape[:-1], 1)), X) + t


								def wrap(func, *args, unsqueeze=False):

								    args = list(args)

								    for i, arg in enumerate(args):

								        if type(arg) == np.ndarray:

								            args[i] = torch.from_numpy(arg)

								            if unsqueeze:

								                args[i] = args[i].unsqueeze(0)


								    result = func(*args)


								    if isinstance(result, tuple):

								        result = list(result)

								        for i, res in enumerate(result):

								            if type(res) == torch.Tensor:

								                if unsqueeze:

								                    res = res.squeeze(0)

								                result[i] = res.numpy()

								        return tuple(result)

								    elif type(result) == torch.Tensor:

								        if unsqueeze:

								            result = result.squeeze(0)

								        return result.numpy()

								    else:

								        return result


								def qrot(q, v):

								    assert q.shape[-1] == 4

								    assert v.shape[-1] == 3

								    assert q.shape[:-1] == v.shape[:-1]


								    qvec = q[..., 1:]

								    uv = torch.cross(qvec, v, dim=len(q.shape) - 1)

								    uuv = torch.cross(qvec, uv, dim=len(q.shape) - 1)

								    return (v + 2 * (q[..., :1] * uv + uuv))


								def qinverse(q, inplace=False):

								    if inplace:

								        q[..., 1:] *= -1

								        return q

								    else:

								        w = q[..., :1]

								        xyz = q[..., 1:]

								        return torch.cat((w, -xyz), dim=len(q.shape) - 1)


								def get_uvd2xyz(uvd, gt_3D, cam):

								    N, T, V,_ = uvd.size()


								    dec_out_all = uvd.view(-1, T, V, 3).clone()

								    root = gt_3D[:, :, 0, :].unsqueeze(-2).repeat(1, 1, V, 1).clone()

								    enc_in_all = uvd[:, :, :, :2].view(-1, T, V, 2).clone()


								    cam_f_all = cam[..., :2].view(-1,1,1,2).repeat(1,T,V,1)

								    cam_c_all = cam[..., 2:4].view(-1,1,1,2).repeat(1,T,V,1)


								    z_global = dec_out_all[:, :, :, 2]

								    z_global[:, :, 0] = root[:, :, 0, 2]

								    z_global[:, :, 1:] = dec_out_all[:, :, 1:, 2] + root[:, :, 1:, 2]

								    z_global = z_global.unsqueeze(-1)


								    uv = enc_in_all - cam_c_all

								    xy = uv * z_global.repeat(1, 1, 1, 2) / cam_f_all

								    xyz_global = torch.cat((xy, z_global), -1)

								    xyz_offset = (xyz_global - xyz_global[:, :, 0, :].unsqueeze(-2).repeat(1, 1, V, 1))


								    return xyz_offset