123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778 |
- import torch
- import torch.nn as nn
- import numpy as np
- from einops import rearrange
- from deep_3drecon.util.mesh_renderer import MeshRenderer
- from deep_3drecon.deep_3drecon_models.bfm import ParametricFaceModel
- class SECC_Renderer(nn.Module):
- def __init__(self, rasterize_size=None, device="cuda"):
- super().__init__()
- self.face_model = ParametricFaceModel('deep_3drecon/BFM')
- self.fov = 2 * np.arctan(self.face_model.center / self.face_model.focal) * 180 / np.pi
- self.znear = 5.
- self.zfar = 15.
- if rasterize_size is None:
- rasterize_size = 2*self.face_model.center
- self.face_renderer = MeshRenderer(rasterize_fov=self.fov, znear=self.znear, zfar=self.zfar, rasterize_size=rasterize_size, use_opengl=False).cuda()
- face_feat = np.load("deep_3drecon/ncc_code.npy", allow_pickle=True)
- self.face_feat = torch.tensor(face_feat.T).unsqueeze(0).to(device=device)
- del_index_re = np.load('deep_3drecon/bfm_right_eye_faces.npy')
- del_index_re = del_index_re - 1
- del_index_le = np.load('deep_3drecon/bfm_left_eye_faces.npy')
- del_index_le = del_index_le - 1
- face_buf_list = []
- for i in range(self.face_model.face_buf.shape[0]):
- if i not in del_index_re and i not in del_index_le:
- face_buf_list.append(self.face_model.face_buf[i])
- face_buf_arr = np.array(face_buf_list)
- self.face_buf = torch.tensor(face_buf_arr).to(device=device)
-
- def forward(self, id, exp, euler, trans):
- """
- id, exp, euler, euler: [B, C] or [B, T, C]
- return:
- MASK: [B, 1, 512, 512], value[0. or 1.0], 1.0 denotes is face
- SECC MAP: [B, 3, 512, 512], value[0~1]
- if input is BTC format, return [B, C, T, H, W]
- """
- bs = id.shape[0]
- is_btc_flag = id.ndim == 3
- if is_btc_flag:
- t = id.shape[1]
- bs = bs * t
- id, exp, euler, trans = id.reshape([bs,-1]), exp.reshape([bs,-1]), euler.reshape([bs,-1]), trans.reshape([bs,-1])
- face_vertex = self.face_model.compute_face_vertex(id, exp, euler, trans)
- face_mask, _, secc_face = self.face_renderer(
- face_vertex, self.face_buf.unsqueeze(0).repeat([bs, 1, 1]), feat=self.face_feat.repeat([bs,1,1]))
- secc_face = (secc_face - 0.5) / 0.5 # scale to -1~1
- if is_btc_flag:
- bs = bs // t
- face_mask = rearrange(face_mask, "(n t) c h w -> n c t h w", n=bs, t=t)
- secc_face = rearrange(secc_face, "(n t) c h w -> n c t h w", n=bs, t=t)
- return face_mask, secc_face
- if __name__ == '__main__':
- import imageio
- renderer = SECC_Renderer(rasterize_size=512)
- ret = np.load("data/processed/videos/May/vid_coeff_fit.npy", allow_pickle=True).tolist()
- idx = 6
- id = torch.tensor(ret['id']).cuda()[idx:idx+1]
- exp = torch.tensor(ret['exp']).cuda()[idx:idx+1]
- angle = torch.tensor(ret['euler']).cuda()[idx:idx+1]
- trans = torch.tensor(ret['trans']).cuda()[idx:idx+1]
- mask, secc = renderer(id, exp, angle*0, trans*0) # [1, 1, 512, 512], [1, 3, 512, 512]
- out_mask = mask[0].permute(1,2,0)
- out_mask = (out_mask * 127.5 + 127.5).int().cpu().numpy()
- imageio.imwrite("out_mask.png", out_mask)
- out_img = secc[0].permute(1,2,0)
- out_img = (out_img * 127.5 + 127.5).int().cpu().numpy()
- imageio.imwrite("out_secc.png", out_img)
|