demo.py

"""
ProHMR demo script.
To run our method you need a folder with images and corresponding OpenPose detections.
These are used to crop the images around the humans and optionally to fit the SMPL model on the detections.

Example usage:
python demo.py --checkpoint=path/to/checkpoint.pt --img_folder=/path/to/images --keypoint_folder=/path/to/json --out_folder=/path/to/output --run_fitting

Running the above will run inference for all images in /path/to/images with corresponding keypoint detections.
The rendered results will be saved to /path/to/output, with the suffix _regression.jpg for the regression (mode) and _fitting.jpg for the fitting.

Please keep in mind that we do not recommend to use `--full_frame` when the image resolution is above 2K because of known issues with the data term of SMPLify.
In these cases you can resize all images such that the maximum image dimension is at most 2K.
"""
import torch
import argparse
import os
import cv2
from tqdm import tqdm

from prohmr.configs import get_config, prohmr_config, dataset_config
from prohmr.models import ProHMR, SMPL
from prohmr.optimization import KeypointFitting, MultiviewRefinement
from prohmr.utils import recursive_to
from prohmr.datasets import OpenPoseDataset
from prohmr.utils.renderer import Renderer

parser = argparse.ArgumentParser(description='ProHMR demo code')
parser.add_argument('--checkpoint', type=str, default='data/checkpoint.pt', help='Path to pretrained model checkpoint')
parser.add_argument('--model_cfg', type=str, default=None,
                    help='Path to config file. If not set use the default (prohmr/configs/prohmr.yaml)')
parser.add_argument('--img_folder', type=str, required=True, help='Folder with input images')
parser.add_argument('--keypoint_folder', type=str, required=True, help='Folder with corresponding OpenPose detections')
parser.add_argument('--out_folder', type=str, default='demo_out', help='Output folder to save rendered results')
parser.add_argument('--out_format', type=str, default='jpg', choices=['jpg', 'png'], help='Output image format')
parser.add_argument('--run_fitting', dest='run_fitting', action='store_true', default=False,
                    help='If set, run fitting on top of regression')
parser.add_argument('--run_multiview', dest='run_multiview', action='store_true', default=False,
                    help='If set, run multi view fitting on top of regression')
parser.add_argument('--write_image', dest="write_image", default=True, help='Batch size for inference/fitting')
parser.add_argument('--full_frame', dest='full_frame', action='store_true', default=False,
                    help='If set, run fitting in the original image space and not in the crop.')
parser.add_argument('--batch_size', type=int, default=1, help='Batch size for inference/fitting')

args = parser.parse_args()

# Use the GPU if available
device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')
if args.model_cfg is None:
    model_cfg = prohmr_config()
else:
    model_cfg = get_config(args.model_cfg)

# Setup model
model = ProHMR.load_from_checkpoint(args.checkpoint, strict=False, cfg=model_cfg).to(device)
model.eval()

# Init Optimizations
optimize = None
if args.run_fitting:
    optimize = KeypointFitting(model_cfg)
if args.run_multiview:
    optimize = MultiviewRefinement(model_cfg)

# Create a dataset on-the-fly
dataset = OpenPoseDataset(model_cfg, img_folder=args.img_folder, keypoint_folder=args.keypoint_folder,
                          max_people_per_image=1)

# Setup a dataloader with batch_size = 1 (Process images sequentially)
dataloader = torch.utils.data.DataLoader(dataset, args.batch_size, shuffle=False)

# Setup the renderer
renderer = Renderer(model_cfg, faces=model.smpl.faces)
write_image = args.write_image

if not os.path.exists(args.out_folder):
    os.makedirs(args.out_folder)

multiview_dict = {}

# Go over each image in the dataset
for i, batch in enumerate(tqdm(dataloader)):

    batch = recursive_to(batch, device)
    with torch.no_grad():

        out = model(batch)
        simp = out['smpl_output']
        # We have access to smpl here
        # a = out['pred_smpl_params']['betas']
        # b = out['pred_vertices']
        with open(args.out_folder + "/posed.obj", 'w') as fp:
            for v in simp.vertices.detach().cpu().numpy()[0]:
                fp.write('v %f %f %f\n' % (v[0], v[1], v[2]))
            for f in model.smpl.faces + 1:
                fp.write('f %d %d %d\n' % (f[0], f[1], f[2]))

        # Ensure Path
        # with open(args.out_folder + "posed.obj", 'w') as fp:
        #     for v in simp.vertices.detach().cpu().numpy()[0]:
        #         fp.write('v %f %f %f\n' % (v[0], v[1], v[2]))
        #     for f in model.smpl.faces + 1:
        #         fp.write('f %d %d %d\n' % (f[0], f[1], f[2]))

    batch_size = batch['img'].shape[0]

    # Write out image
    if write_image:
        for n in range(batch_size):
            img_fn, _ = os.path.splitext(os.path.split(batch['imgname'][n])[1])
            regression_img = renderer(out['pred_vertices'][n, 0].detach().cpu().numpy(),
                                      out['pred_cam_t'][n, 0].detach().cpu().numpy(),
                                      batch['img'][n])
            cv2.imwrite(os.path.join(args.out_folder, f'{img_fn}_regression.{args.out_format}'),
                        255 * regression_img[:, :, ::-1])

    if args.run_fitting or args.run_multiview:
        opt_out = model.downstream_optimization(regression_output=out,
                                                batch=batch,
                                                opt_task=optimize,
                                                use_hips=False,
                                                full_frame=args.full_frame)

        simp = opt_out['smpl_output']
        # opt_output['smpl_params']['betas']
        # opt_output['model_joints'] = model_joints
        # opt_output['vertices'] = vertices

        # write out smpl_betas/ verts
        with open(args.out_folder + "/posed_optimization.obj", 'w') as fp:
            for v in simp.vertices.detach().cpu().numpy()[0]:
                fp.write('v %f %f %f\n' % (v[0], v[1], v[2]))
            for f in model.smpl.faces + 1:
                fp.write('f %d %d %d\n' % (f[0], f[1], f[2]))

        # with open(args.out_folder + "optimization.obj", 'w') as fp:
        #     for v in simp.vertices.detach().cpu().numpy()[0]:
        #         fp.write('v %f %f %f\n' % (v[0], v[1], v[2]))
        #     for f in model.smpl.faces + 1:
        #         fp.write('f %d %d %d\n' % (f[0], f[1], f[2]))

        # Write out image
        if write_image:
            for n in range(batch_size):
                img_fn, _ = os.path.splitext(os.path.split(batch['imgname'][n])[1])
                fitting_img = renderer(opt_out['vertices'][n].detach().cpu().numpy(),
                                       opt_out['camera_translation'][n].detach().cpu().numpy(),
                                       batch['img'][n], imgname=batch['imgname'][n], full_frame=args.full_frame)
                cv2.imwrite(os.path.join(args.out_folder, f'{img_fn}_fitting.{args.out_format}'),
                            255 * fitting_img[:, :, ::-1])

    # Multiview fitting
    # if args.run_multiview:
    #   opt_out = model.downstream_optimization()