Diffstat (limited to 'dreambooth.py')

 dreambooth.py | 13 +++++++++----
 1 file changed, 9 insertions(+), 4 deletions(-)
diff --git a/dreambooth.py b/dreambooth.py
index 96213d0..3eecf9c 100644
--- a/dreambooth.py
+++ b/dreambooth.py
@@ -130,6 +130,12 @@ def parse_args():
         help="The embeddings directory where Textual Inversion embeddings are stored.",
     )
     parser.add_argument(
+        "--mode",
+        type=str,
+        default=None,
+        help="A mode to filter the dataset.",
+    )
+    parser.add_argument(
         "--seed",
         type=int,
         default=None,
@@ -284,7 +290,7 @@ def parse_args():
     parser.add_argument(
         "--sample_frequency",
         type=int,
-        default=100,
+        default=1,
         help="How often to save a checkpoint and sample image"
     )
     parser.add_argument(
@@ -759,6 +765,7 @@ def main():
         num_class_images=args.num_class_images,
         size=args.resolution,
         repeats=args.repeats,
+        mode=args.mode,
         dropout=args.tag_dropout,
         center_crop=args.center_crop,
         template_key=args.train_data_template,
@@ -1046,7 +1053,7 @@ def main():
         unet.eval()
         text_encoder.eval()

-        with torch.autocast("cuda"), torch.inference_mode():
+        with torch.inference_mode():
             for step, batch in enumerate(val_dataloader):
                 latents = vae.encode(batch["pixel_values"]).latent_dist.sample()
                 latents = latents * 0.18215
@@ -1063,8 +1070,6 @@ def main():

                 model_pred = unet(noisy_latents, timesteps, encoder_hidden_states).sample

-                model_pred, noise = accelerator.gather_for_metrics((model_pred, noise))
-
                 # Get the target for loss depending on the prediction type
                 if noise_scheduler.config.prediction_type == "epsilon":
                     target = noise
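A note on the autocast change, since it is easy to misread: after this commit the validation pass runs under torch.inference_mode() alone, without torch.autocast("cuda"). The two context managers do different things: inference_mode() disables autograd tracking, while autocast() controls mixed-precision casting, so validation now runs in the model's native dtype. A minimal standalone sketch of the distinction (a toy module, not code from dreambooth.py):

import torch

# Toy example, not part of dreambooth.py: show what inference_mode()
# does and does not do on its own.
linear = torch.nn.Linear(8, 8)
x = torch.randn(4, 8)

with torch.inference_mode():
    y = linear(x)

print(y.requires_grad)  # False: no autograd graph is recorded
print(y.dtype)          # torch.float32: dtype is unchanged without autocast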
