diff options
Diffstat (limited to 'training/optimization.py')
-rw-r--r-- | training/optimization.py | 43 |
1 file changed, 23 insertions, 20 deletions
diff --git a/training/optimization.py b/training/optimization.py index a0c8673..dfee2b5 100644 --- a/training/optimization.py +++ b/training/optimization.py | |||
@@ -1,4 +1,7 @@ | |||
1 | import math | 1 | import math |
2 | from typing import Literal | ||
3 | |||
4 | import torch | ||
2 | from torch.optim.lr_scheduler import LambdaLR | 5 | from torch.optim.lr_scheduler import LambdaLR |
3 | 6 | ||
4 | from diffusers.utils import logging | 7 | from diffusers.utils import logging |
@@ -6,41 +9,41 @@ from diffusers.utils import logging | |||
6 | logger = logging.get_logger(__name__) | 9 | logger = logging.get_logger(__name__) |
7 | 10 | ||
8 | 11 | ||
def get_one_cycle_schedule(
    optimizer: torch.optim.Optimizer,
    num_training_steps: int,
    warmup: Literal["cos", "linear"] = "cos",
    annealing: Literal["cos", "half_cos", "linear"] = "cos",
    min_lr: float = 0.04,
    mid_point: float = 0.3,
    last_epoch: int = -1,
):
    """
    Create a one-cycle schedule: the lr multiplier ramps from ``min_lr`` up to 1.0
    over the warmup phase, then anneals back down towards 0 for the rest of training.

    Args:
        optimizer (`torch.optim.Optimizer`):
            The optimizer for which to schedule the learning rate.
        num_training_steps (`int`):
            The total number of training steps.
        warmup (`"cos"` or `"linear"`, *optional*, defaults to `"cos"`):
            Shape of the warmup ramp.
        annealing (`"cos"`, `"half_cos"` or `"linear"`, *optional*, defaults to `"cos"`):
            Shape of the annealing phase.
        min_lr (`float`, *optional*, defaults to 0.04):
            Lr multiplier at step 0 (fraction of the optimizer's base lr).
        mid_point (`float`, *optional*, defaults to 0.3):
            Fraction of training at which the peak lr is reached (capped at 0.5).
        last_epoch (`int`, *optional*, defaults to -1):
            The index of the last epoch when resuming training.
    Return:
        `torch.optim.lr_scheduler.LambdaLR` with the appropriate schedule.
    """

    def lr_lambda(current_step: int):
        # Step at which warmup ends and annealing begins.
        thresh_up = int(num_training_steps * min(mid_point, 0.5))

        if current_step < thresh_up:
            progress = float(current_step) / float(max(1, thresh_up))

            if warmup == "linear":
                return min_lr + progress * (1 - min_lr)

            # Cosine ramp from min_lr to 1.0. The (1 - min_lr) scale keeps the
            # peak at exactly 1.0, matching the linear branch; without it the
            # multiplier would overshoot to 1 + min_lr at the end of warmup.
            return min_lr + 0.5 * (1.0 + math.cos(math.pi * (1 + progress))) * (1 - min_lr)

        if annealing == "linear":
            thresh_down = thresh_up * 2

            if current_step < thresh_down:
                # Linear decay from 1.0 back down to min_lr.
                progress = float(thresh_down - current_step) / float(max(1, thresh_down - thresh_up))
                return min_lr + progress * (1 - min_lr)

            # Final linear taper from min_lr to 0; clamp so steps past
            # num_training_steps never produce a negative lr.
            progress = float(num_training_steps - current_step) / float(max(1, num_training_steps - thresh_down))
            return max(0.0, progress) * min_lr

        progress = float(current_step - thresh_up) / float(max(1, num_training_steps - thresh_up))

        if annealing == "half_cos":
            # Quarter-cosine decay (1 -> 0); clamped for steps past the end.
            return max(0.0, 1.0 + math.cos(math.pi * (0.5 + 0.5 * progress)))

        # Half-cosine decay (1 -> 0); clamped for steps past the end.
        return max(0.0, 0.5 * (1.0 + math.cos(math.pi * progress)))

    return LambdaLR(optimizer, lr_lambda, last_epoch)