From 46d631759f59bc6b65458202641e5f5a9bc30b7b Mon Sep 17 00:00:00 2001
From: Volpeon
Date: Mon, 2 Jan 2023 20:13:59 +0100
Subject: Fixed LR finder

---
 train_ti.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

(limited to 'train_ti.py')

diff --git a/train_ti.py b/train_ti.py
index 2b3f017..102c0fa 100644
--- a/train_ti.py
+++ b/train_ti.py
@@ -584,7 +584,7 @@ def main():
     )
 
     if args.find_lr:
-        args.learning_rate = 1e2
+        args.learning_rate = 1e-4
 
     # Use 8-bit Adam for lower memory usage or to fine-tune the model in 16GB GPUs
     if args.use_8bit_adam:
@@ -853,9 +853,9 @@ def main():
             on_train=lambda: tokenizer.set_use_vector_shuffle(args.vector_shuffle),
             on_eval=lambda: tokenizer.set_use_vector_shuffle(False)
         )
-        lr_finder.run(min_lr=1e-4)
+        lr_finder.run(end_lr=1e2)
 
-        plt.savefig(basepath.joinpath("lr.png"))
+        plt.savefig(basepath.joinpath("lr.png"), dpi=300)
         plt.close()
 
         quit()
-- 
cgit v1.2.3-54-g00ecf