Changed init noise algorithm

author: Volpeon <git@volpeon.ink> 2023-03-03 23:37:40 +0100
committer: Volpeon <git@volpeon.ink> 2023-03-03 23:37:40 +0100
commit: 55fc031aebf48f22c9e646eb4d72246bfdbc5068 (patch)
tree: 318c1eb5351fd96a3b408d7baf0d5ee6adcefa69 /pipelines
parent: Removed offset noise from training, added init offset to pipeline (diff)
download: textual-inversion-diff-55fc031aebf48f22c9e646eb4d72246bfdbc5068.tar.gz textual-inversion-diff-55fc031aebf48f22c9e646eb4d72246bfdbc5068.tar.bz2 textual-inversion-diff-55fc031aebf48f22c9e646eb4d72246bfdbc5068.zip
1 files changed, 11 insertions, 3 deletions
diff --git a/pipelines/stable_diffusion/vlpn_stable_diffusion.py b/pipelines/stable_diffusion/vlpn_stable_diffusion.py
index c4f7401..242be29 100644
--- a/pipelines/stable_diffusion/vlpn_stable_diffusion.py
+++ b/pipelines/stable_diffusion/vlpn_stable_diffusion.py
@@ -306,13 +306,19 @@ class VlpnStableDiffusion(DiffusionPipeline):
        return timesteps
-    def prepare_image(self, batch_size, width, height, dtype, device, generator=None):
+    def prepare_image(self, batch_size, width, height, max_offset, dtype, device, generator=None):
-        return torch.randn(
+        offset = (max_offset * (2 * torch.rand(
            (batch_size, 1, 1, 1),
            dtype=dtype,
            device=device,
            generator=generator
-        ).expand(batch_size, 3, width, height)
+        ) - 1)).expand(batch_size, 3, width, height)
+        image = (.1 * torch.normal(
+            mean=offset,
+            std=1,
+            generator=generator
+        )).clamp(-1, 1)
+        return image
    def prepare_latents(self, init_image, timestep, batch_size, dtype, device, generator=None):
        init_image = init_image.to(device=device, dtype=dtype)
@@ -376,6 +382,7 @@ class VlpnStableDiffusion(DiffusionPipeline):
        eta: float = 0.0,
        generator: Optional[Union[torch.Generator, List[torch.Generator]]] = None,
        image: Optional[Union[torch.FloatTensor, PIL.Image.Image]] = None,
+        max_image_offset: float = 1.0,
        output_type: str = "pil",
        return_dict: bool = True,
        callback: Optional[Callable[[int, int, torch.FloatTensor], None]] = None,
@@ -469,6 +476,7 @@ class VlpnStableDiffusion(DiffusionPipeline):
                batch_size * num_images_per_prompt,
                width,
                height,
+                max_image_offset,
                prompt_embeds.dtype,
                device,
                generator
author	Volpeon <git@volpeon.ink>	2023-03-03 23:37:40 +0100
committer	Volpeon <git@volpeon.ink>	2023-03-03 23:37:40 +0100
commit	55fc031aebf48f22c9e646eb4d72246bfdbc5068 (patch)
tree	318c1eb5351fd96a3b408d7baf0d5ee6adcefa69 /pipelines
parent	Removed offset noise from training, added init offset to pipeline (diff)
download	textual-inversion-diff-55fc031aebf48f22c9e646eb4d72246bfdbc5068.tar.gz textual-inversion-diff-55fc031aebf48f22c9e646eb4d72246bfdbc5068.tar.bz2 textual-inversion-diff-55fc031aebf48f22c9e646eb4d72246bfdbc5068.zip