Mirror of https://github.com/gosticks/body-pose-animation.git (synced 2025-10-16 11:45:42 +00:00)
add extra global orientation step
This commit is contained in:
parent a0f594bf2c
commit 9cab019d24

train.py (47)
@@ -1,7 +1,12 @@
# library imports
from collections import defaultdict
import numpy as np
from modules.camera import SimpleCamera
from train_orient import train_orient_with_conf
from modules.utils import is_loss_enabled, toggle_loss_enabled
import os
import pickle
import cv2
import torch
from tqdm.auto import trange

@@ -15,7 +20,7 @@ from camera_estimation import TorchCameraEstimate

def optimize_sample(sample_index, dataset, config, device=torch.device('cpu'), dtype=torch.float32, interactive=True, offscreen=False, verbose=True, initial_pose=None):
# prepare data and SMPL model
model = SMPLyModel.model_from_conf(config, initial_pose=initial_pose)
model = SMPLyModel.model_from_conf(config)
init_keypoints, init_joints, keypoints, conf, est_scale, r, img_path = setup_training(
model=model,
renderer=interactive,
@@ -47,13 +52,49 @@ def optimize_sample(sample_index, dataset, config, device=torch.device('cpu'), d
change_loss_disabled = True
toggle_loss_enabled(config, 'changeLoss', False)

# configure PyTorch device and format
# dtype = torch.float64
if 'device' in config['pose'] is not None:
device = torch.device(config['pose']['device'])
else:
device = torch.device('cpu')
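The device check just above relies on Python comparison chaining: 'device' in config['pose'] is not None evaluates as ('device' in config['pose']) and (config['pose'] is not None). A minimal sketch of the same selection written out explicitly; the helper name and the .get fallback are assumptions, not part of the commit:

import torch

def select_pose_device(config):
    # hypothetical helper that mirrors the committed check in plainer form
    pose_cfg = config.get('pose') or {}
    if 'device' in pose_cfg:
        return torch.device(pose_cfg['device'])
    return torch.device('cpu')
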
# get camera estimation
pose_camera, cam_trans, cam_int, cam_params = SimpleCamera.from_estimation_cam(
cam=camera,
use_intrinsics=config['pose']['useCameraIntrinsics'],
dtype=dtype,
device=device,
)

params = defaultdict(
body_pose=initial_pose,
)

model(**params)

# apply transform to scene
if r is not None:
r.set_group_pose("body", cam_trans.cpu().numpy())

global_orient = train_orient_with_conf(
config=config,
model=model,
keypoints=keypoints,
camera_layer=pose_camera,
renderer=r,
device=device,
use_progress_bar=verbose,
render_steps=(offscreen or interactive)
)

# train for pose
best_out, cam_trans, loss_history, step_imgs, loss_components = train_pose_with_conf(
best_out, loss_history, step_imgs, loss_components = train_pose_with_conf(
config=config,
model=model,
keypoints=keypoints,
keypoint_conf=conf,
camera=camera,
pose_camera=pose_camera,
renderer=r,
device=device,
use_progress_bar=verbose,
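The hunk is cut off mid-call, so the rest of the train_pose_with_conf invocation is not visible here. In short, optimize_sample now builds the SimpleCamera once, runs the torso-based global-orientation fit via train_orient_with_conf, and only then starts the full pose optimization. How the returned global_orient is consumed is not shown in this hunk; one plausible sketch, purely an assumption, would be to write it back into the SMPL model before pose training:

# sketch only, inside optimize_sample after the call above; not part of the visible diff
with torch.no_grad():
    model.global_orient.copy_(global_orient.detach().to(device=device, dtype=dtype))
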
train_orient.py (179, new file)

@@ -0,0 +1,179 @@
from utils.mapping import get_indices_by_name
from modules.distance_loss import WeightedMSELoss
from modules.utils import get_loss_layers
from camera_estimation import TorchCameraEstimate
import smplx
import torch
import torch.nn as nn
from tqdm import tqdm
import torchgeometry as tgm

# internal imports
from modules.pose import BodyPose
from modules.filter import JointFilter
from modules.camera import SimpleCamera
from renderer import Renderer


def train_orient(
model: smplx.SMPL,
# current datapoints
keypoints,
# 3D to 2D camera layer
camera: SimpleCamera,

# pytorch config
device=torch.device('cuda'),
dtype=torch.float32,

# optimizer settings
optimizer=None,
optimizer_type="Adam",
learning_rate=1e-3,
iterations=60,
patience=10,

joint_names=["hip-left", "hip-right",
"shoulder-left", "shoulder-right"],

# renderer options
renderer: Renderer = None,
render_steps=True,

use_progress_bar=True,
):
if use_progress_bar:
print("[pose] starting training")
print("[pose] dtype=", dtype, device)

loss_layer = torch.nn.MSELoss(reduction="sum").to(
device=device,
dtype=dtype
)

# make sure camera module is on the correct device
camera = camera.to(device=device, dtype=dtype)

# setup keypoint data
keypoints = torch.tensor(keypoints).to(device=device, dtype=dtype)

# torso indices
torso_indices = get_indices_by_name(joint_names)

torso_indices = torch.tensor(
torso_indices, dtype=torch.int64, device=device).reshape(4)

# setup torch modules
pose_layer = BodyPose(model, dtype=dtype, device=device,
useBodyMeanAngles=False).to(device=device, dtype=dtype)

parameters = [model.global_orient]

if use_progress_bar:
pbar = tqdm(total=iterations)

# store results for optional plotting
cur_patience = patience
best_loss = None
best_output = None

if optimizer is None:
if optimizer_type.lower() == "lbfgs":
optimizer = torch.optim.LBFGS
elif optimizer_type.lower() == "adam":
optimizer = torch.optim.Adam

optimizer = optimizer(parameters, learning_rate)

# prediction and loss computation closure
def predict():
# return joints based on current model state
body_joints, cur_pose = pose_layer()

# compute homogeneous coordinates and project them to 2D space
points = tgm.convert_points_to_homogeneous(body_joints)
points = camera(points).squeeze()

# compute loss between 2D joint projection and OpenPose keypoints
loss = loss_layer(points[torso_indices],
keypoints[torso_indices])

return loss

# main optimizer closure
def optim_closure():
if torch.is_grad_enabled():
optimizer.zero_grad()

loss = predict()

if loss.requires_grad:
loss.backward()
return loss

# camera translation
R = camera.trans.detach().cpu().numpy().squeeze()

# main optimization loop
for t in range(iterations):
loss = optimizer.step(optim_closure)

# compute loss
cur_loss = loss.item()

if best_loss is None:
best_loss = cur_loss
elif cur_loss < best_loss:
best_loss = cur_loss
best_output = pose_layer.cur_out
else:
cur_patience = cur_patience - 1

if patience == 0:
print("[train] aborted due to patience limit reached")

if use_progress_bar:
pbar.set_description("Error %f" % cur_loss)
pbar.update(1)

if renderer is not None and render_steps:
renderer.render_model(
model=model,
model_out=pose_layer.cur_out,
transform=R
)

if use_progress_bar:
pbar.close()
print("Final result:", loss.item())
return best_output

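Note that the loop decrements cur_patience when the loss stops improving, while the abort message is gated on patience, which never changes, and the loop is not exited. A short sketch of the loop tail as the early-stopping pattern is usually written, assuming the intent is to stop once patience runs out:

for t in range(iterations):
    loss = optimizer.step(optim_closure)
    cur_loss = loss.item()

    if best_loss is None or cur_loss < best_loss:
        best_loss = cur_loss
        best_output = pose_layer.cur_out
    else:
        cur_patience -= 1

    if cur_patience == 0:
        print("[train] aborted due to patience limit reached")
        break
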

def train_orient_with_conf(
config,
camera_layer: TorchCameraEstimate,
model: smplx.SMPL,
keypoints,
device=torch.device('cpu'),
dtype=torch.float32,
renderer: Renderer = None,
render_steps=True,
use_progress_bar=True,
):

best_output = train_orient(
model=model.to(dtype=dtype),
keypoints=keypoints,
camera=camera_layer,
device=device,
dtype=dtype,
renderer=renderer,
joint_names=config['orientation']['joint_names'],
optimizer_type=config['orientation']['optimizer'],
iterations=config['orientation']['iterations'],
learning_rate=config['orientation']['lr'],
render_steps=render_steps,
use_progress_bar=use_progress_bar,
)

return best_output.global_orient

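train_orient_with_conf reads all of its hyperparameters from a config['orientation'] block. A sketch of what that section might contain; the keys come from the calls above, while the example values are taken from train_orient's defaults and may differ from the repository's actual config:

orientation_config = {
    'orientation': {
        'joint_names': ['hip-left', 'hip-right', 'shoulder-left', 'shoulder-right'],
        'optimizer': 'adam',  # or 'lbfgs'
        'iterations': 60,
        'lr': 1e-3,
    },
}
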
@@ -85,8 +85,7 @@ def train_pose(
pose_layer = BodyPose(model, dtype=dtype, device=device,
useBodyMeanAngles=False).to(device=device, dtype=dtype)

# [model.global_orient, pose_layer.body_pose]
parameters = [pose_layer.body_pose]  # list(model.parameters())
parameters = [pose_layer.body_pose]

# setup all loss layers
for l in extra_loss_layers:

@@ -198,7 +197,7 @@ def train_pose(

def train_pose_with_conf(
config,
camera: TorchCameraEstimate,
pose_camera,
model: smplx.SMPL,
keypoints,
keypoint_conf,

@@ -209,29 +208,6 @@ def train_pose_with_conf(
use_progress_bar=True,
print_loss_layers=False
):

# configure PyTorch device and format
# dtype = torch.float64
if 'device' in config['pose'] is not None:
device = torch.device(config['pose']['device'])
else:
device = torch.device('cpu')

# create camera module
pose_camera, cam_trans, cam_int, cam_params = SimpleCamera.from_estimation_cam(
cam=camera,
use_intrinsics=config['pose']['useCameraIntrinsics'],
dtype=dtype,
device=device,
)

# pose_camera, cam_trans = SimpleCamera.dummy_camera(
# device=device, dtype=dtype)

# apply transform to scene
if renderer is not None:
renderer.set_group_pose("body", cam_trans.cpu().numpy())

loss_layers = get_loss_layers(config, model, device, dtype)

if print_loss_layers:

@@ -254,4 +230,4 @@ def train_pose_with_conf(
extra_loss_layers=loss_layers
)

return best_output, cam_trans, loss_history, offscreen_step_output, loss_components
return best_output, loss_history, offscreen_step_output, loss_components
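Taken together, the last hunks change the contract of train_pose_with_conf: it no longer builds the camera or returns cam_trans, so call sites are updated along the lines of the train.py hunk at the top, roughly:

# before: best_out, cam_trans, loss_history, step_imgs, loss_components = train_pose_with_conf(...)
# after:  best_out, loss_history, step_imgs, loss_components = train_pose_with_conf(..., pose_camera=pose_camera)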