Small performance improvements

author: Volpeon <git@volpeon.ink> 2022-10-02 20:57:43 +0200
committer: Volpeon <git@volpeon.ink> 2022-10-02 20:57:43 +0200
commit: 64c594869135354a38353551bd58a93e15bd5b85 (patch)
tree: 2bcc085a396824f78e58c90b1f6e9553c7f5c8c1 /pipelines
parent: Fix img2img (diff)
download: textual-inversion-diff-64c594869135354a38353551bd58a93e15bd5b85.tar.gz
textual-inversion-diff-64c594869135354a38353551bd58a93e15bd5b85.tar.bz2
textual-inversion-diff-64c594869135354a38353551bd58a93e15bd5b85.zip
1 file changed, 10 insertions, 8 deletions
diff --git a/pipelines/stable_diffusion/vlpn_stable_diffusion.py b/pipelines/stable_diffusion/vlpn_stable_diffusion.py
index b4c85e9..8fbe5f9 100644
--- a/pipelines/stable_diffusion/vlpn_stable_diffusion.py
+++ b/pipelines/stable_diffusion/vlpn_stable_diffusion.py
@@ -223,15 +223,16 @@ class VlpnStableDiffusion(DiffusionPipeline):
        # Unlike in other pipelines, latents need to be generated in the target device
        # for 1-to-1 results reproducibility with the CompVis implementation.
        # However this currently doesn't work in `mps`.
-        latents_device = "cpu" if self.device.type == "mps" else self.device
+        latents_dtype = text_embeddings.dtype
        latents_shape = (batch_size, self.unet.in_channels, height // 8, width // 8)
        if latents is None:
-            latents = torch.randn(
-                latents_shape,
-                generator=generator,
-                device=latents_device,
-                dtype=text_embeddings.dtype,
-            )
+            if self.device.type == "mps":
+                # randn does not exist on mps
+                latents = torch.randn(latents_shape, generator=generator, device="cpu", dtype=latents_dtype).to(
+                    self.device
+                )
+            else:
+                latents = torch.randn(latents_shape, generator=generator, device=self.device, dtype=latents_dtype)
        elif isinstance(latents, PIL.Image.Image):
            latents = preprocess(latents, width, height)
            latent_dist = self.vae.encode(latents.to(self.device)).latent_dist
@@ -259,7 +260,8 @@ class VlpnStableDiffusion(DiffusionPipeline):
        else:
            if latents.shape != latents_shape:
                raise ValueError(f"Unexpected latents shape, got {latents.shape}, expected {latents_shape}")
-            latents = latents.to(self.device)
+            if latents.device != self.device:
+                raise ValueError(f"Unexpected latents device, got {latents.device}, expected {self.device}")
        # if we use LMSDiscreteScheduler, let's make sure latents are multiplied by sigmas
        if ensure_sigma:
author	Volpeon <git@volpeon.ink>	2022-10-02 20:57:43 +0200
committer	Volpeon <git@volpeon.ink>	2022-10-02 20:57:43 +0200
commit	64c594869135354a38353551bd58a93e15bd5b85 (patch)
tree	2bcc085a396824f78e58c90b1f6e9553c7f5c8c1 /pipelines
parent	Fix img2img (diff)
download	textual-inversion-diff-64c594869135354a38353551bd58a93e15bd5b85.tar.gz textual-inversion-diff-64c594869135354a38353551bd58a93e15bd5b85.tar.bz2 textual-inversion-diff-64c594869135354a38353551bd58a93e15bd5b85.zip