feat(train): arg to offset lr for resumed runs
tools/train/train.py  (+7 -2)

@@ -406,7 +406,12 @@ class TrainingArguments:
             "help": "Whether to use staircase or continuous learning rate when using exponential decay."
         },
     )
-
+    lr_resume_offset: bool = field(
+        default=False,
+        metadata={
+            "help": "Whether to offset the learning rate function with current step when resuming a run."
+        },
+    )
     logging_steps: int = field(
         default=40, metadata={"help": "Log every X updates steps."}
     )
@@ -781,7 +786,7 @@ def main():
         transition_steps=training_args.warmup_steps + 1,  # ensure not 0
     )
     # offset step when resuming
-    if model_metadata.get("step", 0):
+    if model_metadata.get("step", 0) and training_args.lr_resume_offset:
         warmup_fn = optax.join_schedules(
             schedules=[optax.constant_schedule(0.0), warmup_fn],
             boundaries=[model_metadata["step"]],
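
For context, a minimal sketch (not part of the commit) of the optax.join_schedules pattern used above: the learning rate is held at 0.0 until the resumed step, and the original warmup schedule then restarts from that step. The warmup_steps, peak_lr, and resume_step values below are hypothetical and chosen only for illustration.

# Sketch of the joined-schedule behavior; values are hypothetical.
import optax

warmup_steps = 100
peak_lr = 1e-3
resume_step = 50  # stands in for model_metadata["step"] of the resumed run

# Plain warmup schedule, as created just before the hunk shown above.
warmup_fn = optax.linear_schedule(
    init_value=0.0, end_value=peak_lr, transition_steps=warmup_steps + 1
)

# Joined schedule: hold 0.0 until resume_step, then run the warmup from scratch,
# so the warmup effectively starts counting at the resumed step.
offset_fn = optax.join_schedules(
    schedules=[optax.constant_schedule(0.0), warmup_fn],
    boundaries=[resume_step],
)

print(offset_fn(resume_step - 1))   # 0.0, still in the constant segment
print(offset_fn(resume_step))       # warmup_fn(0) == 0.0, warmup restarts here
print(offset_fn(resume_step + 10))  # warmup_fn(10), 10 steps into the warmup

With lr_resume_offset left at its default of False, the if-block is skipped and the schedule is evaluated at the global step directly, so a resumed run whose step is already past warmup_steps continues at the post-warmup learning rate.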