import torch from timm.models import ConvNeXt from timm.data.constants import IMAGENET_DEFAULT_MEAN, IMAGENET_DEFAULT_STD from torch.nn import functional as F class ConvNeXtDiscriminator: def __init__(self, model: ConvNeXt, input_size: int) -> None: self.net = model self.input_size = input_size self.img_mean = torch.tensor(IMAGENET_DEFAULT_MEAN).view(1, -1, 1, 1) self.img_std = torch.tensor(IMAGENET_DEFAULT_STD).view(1, -1, 1, 1) def get_score(self, img): pred = self.get_all(img) return torch.softmax(pred, dim=-1)[:, 1] def get_all(self, img): img_mean = self.img_mean.to(device=img.device, dtype=img.dtype) img_std = self.img_std.to(device=img.device, dtype=img.dtype) img = ((img + 1.0) / 2.0).sub(img_mean).div(img_std) img = F.interpolate( img, size=(self.input_size, self.input_size), mode="bicubic", align_corners=True, ) pred = self.net(img) return pred