| author | Volpeon <git@volpeon.ink> | 2023-02-08 07:27:55 +0100 |
|---|---|---|
| committer | Volpeon <git@volpeon.ink> | 2023-02-08 07:27:55 +0100 |
| commit | 9ea20241bbeb2f32199067096272e13647c512eb (patch) | |
| tree | 9e0891a74d0965da75e9d3f30628b69d5ba3deaf /train_lora.py | |
| parent | Fix Lora memory usage (diff) | |
Fixed Lora training
Diffstat (limited to 'train_lora.py')

| mode | file | lines changed |
|---|---|---|
| -rw-r--r-- | train_lora.py | 25 |

1 file changed, 18 insertions(+), 7 deletions(-)
```diff
diff --git a/train_lora.py b/train_lora.py
index b273ae1..ab1753b 100644
--- a/train_lora.py
+++ b/train_lora.py
@@ -13,7 +13,7 @@ from accelerate.logging import get_logger
 from accelerate.utils import LoggerType, set_seed
 from slugify import slugify
 from diffusers.loaders import AttnProcsLayers
-from diffusers.models.cross_attention import LoRAXFormersCrossAttnProcessor
+from diffusers.models.cross_attention import LoRAXFormersCrossAttnProcessor, LoRACrossAttnProcessor
 
 from util import load_config, load_embeddings_from_dir
 from data.csv import VlpnDataModule, keyword_filter
@@ -178,6 +178,11 @@ def parse_args():
         help="Number of updates steps to accumulate before performing a backward/update pass.",
     )
     parser.add_argument(
+        "--gradient_checkpointing",
+        action="store_true",
+        help="Whether or not to use gradient checkpointing to save memory at the expense of slower backward pass.",
+    )
+    parser.add_argument(
         "--find_lr",
         action="store_true",
         help="Automatically find a learning rate (no training).",
@@ -402,6 +407,12 @@ def main():
         mixed_precision=args.mixed_precision
     )
 
+    weight_dtype = torch.float32
+    if args.mixed_precision == "fp16":
+        weight_dtype = torch.float16
+    elif args.mixed_precision == "bf16":
+        weight_dtype = torch.bfloat16
+
     logging.basicConfig(filename=output_dir.joinpath("log.txt"), level=logging.DEBUG)
 
     if args.seed is None:
@@ -418,6 +429,12 @@ def main():
         vae.set_use_memory_efficient_attention_xformers(True)
         unet.enable_xformers_memory_efficient_attention()
 
+    if args.gradient_checkpointing:
+        unet.enable_gradient_checkpointing()
+
+    unet.to(accelerator.device, dtype=weight_dtype)
+    text_encoder.to(accelerator.device, dtype=weight_dtype)
+
     lora_attn_procs = {}
     for name in unet.attn_processors.keys():
         cross_attention_dim = None if name.endswith("attn1.processor") else unet.config.cross_attention_dim
@@ -467,12 +484,6 @@ def main():
     else:
         optimizer_class = torch.optim.AdamW
 
-    weight_dtype = torch.float32
-    if args.mixed_precision == "fp16":
-        weight_dtype = torch.float16
-    elif args.mixed_precision == "bf16":
-        weight_dtype = torch.bfloat16
-
     trainer = partial(
         train,
         accelerator=accelerator,
```
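For context, a minimal sketch of how the touched part of `main()` reads after this commit: the `weight_dtype` selection and gradient checkpointing now run before the UNet and text encoder are moved to the accelerator device, ahead of the LoRA attention-processor setup. Note that `args`, `accelerator`, `unet`, and `text_encoder` come from the surrounding script, the diff truncates the `lora_attn_procs` loop after the `cross_attention_dim` line, and everything below that point (the `hidden_size` lookup and the `LoRACrossAttnProcessor` construction) is an assumption based on the diffusers LoRA examples of this release; the script also imports `LoRAXFormersCrossAttnProcessor` and may pick that variant when xformers is enabled.

```python
import torch
from diffusers.loaders import AttnProcsLayers
from diffusers.models.cross_attention import LoRACrossAttnProcessor

# Pick the weight dtype from the mixed-precision setting (moved up in this
# commit so it is available before the models are placed on the device).
weight_dtype = torch.float32
if args.mixed_precision == "fp16":
    weight_dtype = torch.float16
elif args.mixed_precision == "bf16":
    weight_dtype = torch.bfloat16

# Optionally trade extra backward-pass compute for lower memory usage.
if args.gradient_checkpointing:
    unet.enable_gradient_checkpointing()

# The frozen base models are kept in the reduced dtype; only the LoRA layers train.
unet.to(accelerator.device, dtype=weight_dtype)
text_encoder.to(accelerator.device, dtype=weight_dtype)

# Install a LoRA processor on every attention block of the UNet.
# NOTE: the block-size lookup and processor construction below are an
# assumption following the diffusers LoRA example, not part of this diff.
lora_attn_procs = {}
for name in unet.attn_processors.keys():
    cross_attention_dim = None if name.endswith("attn1.processor") else unet.config.cross_attention_dim
    if name.startswith("mid_block"):
        hidden_size = unet.config.block_out_channels[-1]
    elif name.startswith("up_blocks"):
        block_id = int(name[len("up_blocks.")])
        hidden_size = list(reversed(unet.config.block_out_channels))[block_id]
    elif name.startswith("down_blocks"):
        block_id = int(name[len("down_blocks.")])
        hidden_size = unet.config.block_out_channels[block_id]
    lora_attn_procs[name] = LoRACrossAttnProcessor(
        hidden_size=hidden_size, cross_attention_dim=cross_attention_dim
    )

unet.set_attn_processor(lora_attn_procs)
lora_layers = AttnProcsLayers(unet.attn_processors)  # trainable parameters handed to the optimizer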
