From 55fc031aebf48f22c9e646eb4d72246bfdbc5068 Mon Sep 17 00:00:00 2001 From: Volpeon Date: Fri, 3 Mar 2023 23:37:40 +0100 Subject: Changed init noise algorithm --- pipelines/stable_diffusion/vlpn_stable_diffusion.py | 14 +++++++++++--- 1 file changed, 11 insertions(+), 3 deletions(-) (limited to 'pipelines') diff --git a/pipelines/stable_diffusion/vlpn_stable_diffusion.py b/pipelines/stable_diffusion/vlpn_stable_diffusion.py index c4f7401..242be29 100644 --- a/pipelines/stable_diffusion/vlpn_stable_diffusion.py +++ b/pipelines/stable_diffusion/vlpn_stable_diffusion.py @@ -306,13 +306,19 @@ class VlpnStableDiffusion(DiffusionPipeline): return timesteps - def prepare_image(self, batch_size, width, height, dtype, device, generator=None): - return torch.randn( + def prepare_image(self, batch_size, width, height, max_offset, dtype, device, generator=None): + offset = (max_offset * (2 * torch.rand( (batch_size, 1, 1, 1), dtype=dtype, device=device, generator=generator - ).expand(batch_size, 3, width, height) + ) - 1)).expand(batch_size, 3, width, height) + image = (.1 * torch.normal( + mean=offset, + std=1, + generator=generator + )).clamp(-1, 1) + return image def prepare_latents(self, init_image, timestep, batch_size, dtype, device, generator=None): init_image = init_image.to(device=device, dtype=dtype) @@ -376,6 +382,7 @@ class VlpnStableDiffusion(DiffusionPipeline): eta: float = 0.0, generator: Optional[Union[torch.Generator, List[torch.Generator]]] = None, image: Optional[Union[torch.FloatTensor, PIL.Image.Image]] = None, + max_image_offset: float = 1.0, output_type: str = "pil", return_dict: bool = True, callback: Optional[Callable[[int, int, torch.FloatTensor], None]] = None, @@ -469,6 +476,7 @@ class VlpnStableDiffusion(DiffusionPipeline): batch_size * num_images_per_prompt, width, height, + max_image_offset, prompt_embeds.dtype, device, generator -- cgit v1.2.3-54-g00ecf