NimaGAN/frontalize_face.py at main · nima-kam/NimaGAN · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
# python3.7
"""
Manipulates the latent code to frontalize the generated face.

This file loads an initial latent code and a pre-trained neural
network classifier that predicts whether the corresponding face's
yaw angle is positive or negative on a scale of -90 to 90 degrees.
It uses these components to iteratively adjust the latent code
so that the final generated face is frontalized. The neural
network's gradient with respect to the input latent codes guides
the manipulation process. Optionally, a saved boundary for yaw
editing can also be used. The final adjusted latent code, which
generates a frontalized face, is saved for further use.
"""

import os.path
import torch
import argparse
from collections import defaultdict
import cv2
import numpy as np
from tqdm import tqdm
from utils.nl_manipulator import frontalize_latent,predict_yaw

from models.model_settings import MODEL_POOL
from models.pggan_generator import PGGANGenerator
from models.stylegan_generator import StyleGANGenerator
from models.stylegan2_generator import StyleGAN2Generator
from utils.logger import setup_logger

def parse_args():
    """Parses arguments."""
    parser = argparse.ArgumentParser(description='Generate images with given model and frontalize latent code.')
    parser.add_argument('-m', '--model_name', type=str, required=True,
                        choices=list(MODEL_POOL),
                        help='Name of the model for image generation. (required)')
    parser.add_argument('-o', '--output_dir', type=str, required=True,
                        help='Directory to save the output results. (required)')
    parser.add_argument('-l', '--latent_code_path', type=str, required=True,
                        help='Path to the initial latent code (.npy file). (required)')
    parser.add_argument('-b', '--boundary_path', type=str, default=None,
                        help='Path to the saved boundary for editing yaw (.npy file). (required)')
    parser.add_argument('-s', '--latent_space_type', type=str, default='z',
                        choices=['z', 'Z', 'w', 'W', 'wp', 'wP', 'Wp', 'WP'],
                        help='Latent space used in Style GAN. (default: `Z`)')
    parser.add_argument('-t', '--yaw_threshold', type=float, default=4.0,
                        help='Threshold for yaw angle to consider the image as frontal. (default: 4.0)')
    parser.add_argument('-i', '--max_iter', type=int, default=10,
                        help='Maximum number of iterations for adjustment. (default: 10)')
    parser.add_argument('-c', '--latent_classifier', required=True,
                        help='Path to pre-trained latent classifier .PKL file for using its gradient.')

    return parser.parse_args()


# Main function to execute the frontalization process
def main():
    """Main function."""
    args = parse_args()
    logger = setup_logger(args.output_dir, logger_name='generate_data')

    logger.info(f'Initializing generator.')
    gan_type = MODEL_POOL[args.model_name]['gan_type']
    if gan_type == 'pggan':
        model = PGGANGenerator(args.model_name, logger)
        kwargs = {}
    elif gan_type == 'stylegan':
        model = StyleGANGenerator(args.model_name, logger)
        kwargs = {'latent_space_type': args.latent_space_type}
    elif gan_type == 'stylegan2':
        model = StyleGAN2Generator(args.model_name, logger)
        kwargs = {'latent_space_type': args.latent_space_type}
    else:
        raise NotImplementedError(f'Not implemented GAN type `{gan_type}`!')

    # Load the initial latent code
    logger.info(f'Loading initial latent code from {args.latent_code_path}.')
    initial_latent = np.load(args.latent_code_path)

    logger.info(f'Loading yaw latent classifier from {args.latent_classifier}.')
    nn=torch.load(args.latent_classifier)
    # Load the yaw boundary
    if not (args.boundary_path is None):
        logger.info(f'Loading yaw boundary from {args.boundary_path}.')
        yaw_bound = np.load(args.boundary_path)


    # Perform frontalization
    logger.info(f'Performing frontalization.')
    final_latent, latent_list, yaw_list = frontalize_latent(
        start_latent=initial_latent,
        yaw_predict=predict_yaw,
        yaw_bound=yaw_bound,
        yaw_classifier=nn,
        generator=model,
        synthesis_kwargs=kwargs,
        max_iter=args.max_iter,
        yaw_thresh=args.yaw_threshold
    )

    # Save the final latent code
    final_latent_path = os.path.join(args.output_dir, os.path.basename(args.latent_code_path).replace('.npy', '_front.npy'))
    logger.info(f'Saving final latent code to {final_latent_path}.')
    np.save(final_latent_path, final_latent)

if __name__ == '__main__':
    main()