summaryrefslogtreecommitdiffstats
path: root/train_ti.py
diff options
context:
space:
mode:
Diffstat (limited to 'train_ti.py')
-rw-r--r--train_ti.py16
1 files changed, 4 insertions, 12 deletions
diff --git a/train_ti.py b/train_ti.py
index 0891c49..fc34d27 100644
--- a/train_ti.py
+++ b/train_ti.py
@@ -159,7 +159,7 @@ def parse_args():
159 parser.add_argument( 159 parser.add_argument(
160 "--tag_dropout", 160 "--tag_dropout",
161 type=float, 161 type=float,
162 default=0, 162 default=0.1,
163 help="Tag dropout probability.", 163 help="Tag dropout probability.",
164 ) 164 )
165 parser.add_argument( 165 parser.add_argument(
@@ -406,18 +406,12 @@ def parse_args():
406 help="Embedding decay target." 406 help="Embedding decay target."
407 ) 407 )
408 parser.add_argument( 408 parser.add_argument(
409 "--emb_decay_factor", 409 "--emb_decay",
410 default=1, 410 default=1e-1,
411 type=float, 411 type=float,
412 help="Embedding decay factor." 412 help="Embedding decay factor."
413 ) 413 )
414 parser.add_argument( 414 parser.add_argument(
415 "--emb_decay_start",
416 default=0,
417 type=float,
418 help="Embedding decay start offset."
419 )
420 parser.add_argument(
421 "--noise_timesteps", 415 "--noise_timesteps",
422 type=int, 416 type=int,
423 default=1000, 417 default=1000,
@@ -587,12 +581,10 @@ def main():
587 tokenizer=tokenizer, 581 tokenizer=tokenizer,
588 sample_scheduler=sample_scheduler, 582 sample_scheduler=sample_scheduler,
589 checkpoint_output_dir=checkpoint_output_dir, 583 checkpoint_output_dir=checkpoint_output_dir,
590 learning_rate=args.learning_rate,
591 gradient_checkpointing=args.gradient_checkpointing, 584 gradient_checkpointing=args.gradient_checkpointing,
592 use_emb_decay=args.use_emb_decay, 585 use_emb_decay=args.use_emb_decay,
593 emb_decay_target=args.emb_decay_target, 586 emb_decay_target=args.emb_decay_target,
594 emb_decay_factor=args.emb_decay_factor, 587 emb_decay=args.emb_decay,
595 emb_decay_start=args.emb_decay_start,
596 use_ema=args.use_ema, 588 use_ema=args.use_ema,
597 ema_inv_gamma=args.ema_inv_gamma, 589 ema_inv_gamma=args.ema_inv_gamma,
598 ema_power=args.ema_power, 590 ema_power=args.ema_power,