|
|
|
|
|
from __future__ import annotations |
|
|
|
import argparse |
|
import functools |
|
import os |
|
import pickle |
|
import sys |
|
|
|
import gradio as gr |
|
import numpy as np |
|
import torch |
|
import torch.nn as nn |
|
from huggingface_hub import hf_hub_download |
|
|
|
sys.path.insert(0, 'stylegan3') |
|
|
|
ORIGINAL_REPO_URL = 'https://github.com/NVlabs/stylegan3' |
|
TITLE = 'NVlabs/stylegan3' |
|
DESCRIPTION = f'This is a demo for {ORIGINAL_REPO_URL}.' |
|
SAMPLE_IMAGE_DIR = 'https://huggingface.co./spaces/hysts/StyleGAN3/resolve/main/samples' |
|
ARTICLE = f'''## Generated images |
|
- truncation: 0.7 |
|
### AFHQv2 |
|
- size: 512x512 |
|
- seed: 0-99 |
|
![AFHQv2 samples]({SAMPLE_IMAGE_DIR}/afhqv2.jpg) |
|
### FFHQ |
|
- size: 1024x1024 |
|
- seed: 0-99 |
|
![FFHQ samples]({SAMPLE_IMAGE_DIR}/ffhq.jpg) |
|
### FFHQ-U |
|
- size: 1024x1024 |
|
- seed: 0-99 |
|
![FFHQ-U samples]({SAMPLE_IMAGE_DIR}/ffhq-u.jpg) |
|
### MetFaces |
|
- size: 1024x1024 |
|
- seed: 0-99 |
|
![MetFaces samples]({SAMPLE_IMAGE_DIR}/metfaces.jpg) |
|
### MetFaces-U |
|
- size: 1024x1024 |
|
- seed: 0-99 |
|
![MetFaces-U samples]({SAMPLE_IMAGE_DIR}/metfaces-u.jpg) |
|
''' |
|
|
|
TOKEN = os.environ['TOKEN'] |
|
|
|
|
|
def parse_args() -> argparse.Namespace: |
|
parser = argparse.ArgumentParser() |
|
parser.add_argument('--device', type=str, default='cpu') |
|
parser.add_argument('--theme', type=str) |
|
parser.add_argument('--live', action='store_true') |
|
parser.add_argument('--share', action='store_true') |
|
parser.add_argument('--port', type=int) |
|
parser.add_argument('--disable-queue', |
|
dest='enable_queue', |
|
action='store_false') |
|
parser.add_argument('--allow-flagging', type=str, default='never') |
|
parser.add_argument('--allow-screenshot', action='store_true') |
|
return parser.parse_args() |
|
|
|
|
|
def make_transform(translate: tuple[float, float], angle: float) -> np.ndarray: |
|
mat = np.eye(3) |
|
sin = np.sin(angle / 360 * np.pi * 2) |
|
cos = np.cos(angle / 360 * np.pi * 2) |
|
mat[0][0] = cos |
|
mat[0][1] = sin |
|
mat[0][2] = translate[0] |
|
mat[1][0] = -sin |
|
mat[1][1] = cos |
|
mat[1][2] = translate[1] |
|
return mat |
|
|
|
|
|
def generate_z(z_dim: int, seed: int, device: torch.device) -> torch.Tensor: |
|
return torch.from_numpy(np.random.RandomState(seed).randn( |
|
1, z_dim)).to(device).float() |
|
|
|
|
|
@torch.inference_mode() |
|
def generate_image(model_name: str, seed: int, truncation_psi: float, |
|
tx: float, ty: float, angle: float, |
|
model_dict: dict[str, nn.Module], |
|
device: torch.device) -> np.ndarray: |
|
model = model_dict[model_name] |
|
seed = int(np.clip(seed, 0, np.iinfo(np.uint32).max)) |
|
|
|
z = generate_z(model.z_dim, seed, device) |
|
label = torch.zeros([1, model.c_dim], device=device) |
|
|
|
mat = make_transform((tx, ty), angle) |
|
mat = np.linalg.inv(mat) |
|
model.synthesis.input.transform.copy_(torch.from_numpy(mat)) |
|
|
|
out = model(z, label, truncation_psi=truncation_psi) |
|
out = (out.permute(0, 2, 3, 1) * 127.5 + 128).clamp(0, 255).to(torch.uint8) |
|
return out[0].cpu().numpy() |
|
|
|
|
|
def load_model(file_name: str, device: torch.device) -> nn.Module: |
|
path = hf_hub_download('hysts/StyleGAN3', |
|
f'models/{file_name}', |
|
use_auth_token=TOKEN) |
|
with open(path, 'rb') as f: |
|
model = pickle.load(f)['G_ema'] |
|
model.eval() |
|
model.to(device) |
|
with torch.inference_mode(): |
|
z = torch.zeros((1, model.z_dim)).to(device) |
|
label = torch.zeros([1, model.c_dim], device=device) |
|
model(z, label) |
|
return model |
|
|
|
|
|
def main(): |
|
args = parse_args() |
|
device = torch.device(args.device) |
|
|
|
model_names = { |
|
'AFHQv2-512-R': 'stylegan3-r-afhqv2-512x512.pkl', |
|
'FFHQ-1024-R': 'stylegan3-r-ffhq-1024x1024.pkl', |
|
'FFHQ-U-256-R': 'stylegan3-r-ffhqu-256x256.pkl', |
|
'FFHQ-U-1024-R': 'stylegan3-r-ffhqu-1024x1024.pkl', |
|
'MetFaces-1024-R': 'stylegan3-r-metfaces-1024x1024.pkl', |
|
'MetFaces-U-1024-R': 'stylegan3-r-metfacesu-1024x1024.pkl', |
|
'AFHQv2-512-T': 'stylegan3-t-afhqv2-512x512.pkl', |
|
'FFHQ-1024-T': 'stylegan3-t-ffhq-1024x1024.pkl', |
|
'FFHQ-U-256-T': 'stylegan3-t-ffhqu-256x256.pkl', |
|
'FFHQ-U-1024-T': 'stylegan3-t-ffhqu-1024x1024.pkl', |
|
'MetFaces-1024-T': 'stylegan3-t-metfaces-1024x1024.pkl', |
|
'MetFaces-U-1024-T': 'stylegan3-t-metfacesu-1024x1024.pkl', |
|
} |
|
|
|
model_dict = { |
|
name: load_model(file_name, device) |
|
for name, file_name in model_names.items() |
|
} |
|
|
|
func = functools.partial(generate_image, |
|
model_dict=model_dict, |
|
device=device) |
|
func = functools.update_wrapper(func, generate_image) |
|
|
|
gr.Interface( |
|
func, |
|
[ |
|
gr.inputs.Radio(list(model_names.keys()), |
|
type='value', |
|
default='FFHQ-1024-R', |
|
label='Model'), |
|
gr.inputs.Number(default=0, label='Seed'), |
|
gr.inputs.Slider( |
|
0, 2, step=0.05, default=0.7, label='Truncation psi'), |
|
gr.inputs.Slider(-1, 1, step=0.05, default=0, label='Translate X'), |
|
gr.inputs.Slider(-1, 1, step=0.05, default=0, label='Translate Y'), |
|
gr.inputs.Slider(-180, 180, step=5, default=0, label='Angle'), |
|
], |
|
gr.outputs.Image(type='numpy', label='Output'), |
|
title=TITLE, |
|
description=DESCRIPTION, |
|
article=ARTICLE, |
|
theme=args.theme, |
|
allow_screenshot=args.allow_screenshot, |
|
allow_flagging=args.allow_flagging, |
|
live=args.live, |
|
).launch( |
|
enable_queue=args.enable_queue, |
|
server_port=args.port, |
|
share=args.share, |
|
) |
|
|
|
|
|
if __name__ == '__main__': |
|
main() |
|
|