import os import pathlib import shlex import subprocess import sys import huggingface_hub import numpy as np import torch from torch import nn if os.getenv("SYSTEM") == "spaces": subprocess.run(shlex.split("sed -i '14,21d' StyleSwin/op/fused_act.py"), check=False) # noqa: S603 subprocess.run(shlex.split("sed -i '12,19d' StyleSwin/op/upfirdn2d.py"), check=False) # noqa: S603 current_dir = pathlib.Path(__file__).parent submodule_dir = current_dir / "StyleSwin" sys.path.insert(0, submodule_dir.as_posix()) from models.generator import Generator # noqa: E402 # pyright: ignore[reportMissingImports] class Model: MODEL_NAMES = ( "CelebAHQ_256", "FFHQ_256", "LSUNChurch_256", "CelebAHQ_1024", "FFHQ_1024", ) def __init__(self) -> None: self.device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu") self._download_all_models() self.model_name = self.MODEL_NAMES[3] self.model = self._load_model(self.model_name) self.std = torch.FloatTensor([0.229, 0.224, 0.225])[None, :, None, None].to(self.device) self.mean = torch.FloatTensor([0.485, 0.456, 0.406])[None, :, None, None].to(self.device) def _load_model(self, model_name: str) -> nn.Module: size = int(model_name.split("_")[1]) channel_multiplier = 1 if size == 1024 else 2 # noqa: PLR2004 model = Generator(size, style_dim=512, n_mlp=8, channel_multiplier=channel_multiplier) ckpt_path = huggingface_hub.hf_hub_download("public-data/StyleSwin", f"models/{model_name}.pt") ckpt = torch.load(ckpt_path) model.load_state_dict(ckpt["g_ema"]) model.to(self.device) model.eval() return model def set_model(self, model_name: str) -> None: if model_name == self.model_name: return self.model_name = model_name self.model = self._load_model(model_name) def _download_all_models(self) -> None: for name in self.MODEL_NAMES: self._load_model(name) def generate_z(self, seed: int) -> torch.Tensor: seed = int(np.clip(seed, 0, np.iinfo(np.uint32).max)) z = np.random.RandomState(seed).randn(1, 512) return torch.from_numpy(z).float().to(self.device) def postprocess(self, tensors: torch.Tensor) -> np.ndarray: if not tensors.dim() == 4: # noqa: PLR2004 raise ValueError("tensors must be 4-dimensional") tensors = tensors * self.std + self.mean tensors = (tensors * 255).clamp(0, 255).to(torch.uint8) return tensors.permute(0, 2, 3, 1).cpu().numpy() @torch.inference_mode() def generate_image(self, seed: int) -> np.ndarray: z = self.generate_z(seed) out, _ = self.model(z) out = self.postprocess(out) return out[0] def set_model_and_generate_image(self, model_name: str, seed: int) -> np.ndarray: self.set_model(model_name) return self.generate_image(seed)