This commit is contained in:
mrq 2025-02-28 22:15:37 -06:00
parent ddc49c89c5
commit 56f8be4d62
2 changed files with 2 additions and 2 deletions

View File

@@ -446,7 +446,7 @@ class Engines(dict[str, Engine]):
engine.tokens_processed = 0
# update the LR because for some god awful reason it gets overwritten when loading from a checkpoint but only when it's not using a scheduler
-if cfg.hyperparameters.scheduler_type == "":
+if cfg.hyperparameters.scheduler == "":
self.set_lr(cfg.hyperparameters.learning_rate)
self._update()

View File

@@ -47,7 +47,7 @@ class Engine(DeepSpeedEngine):
}
# kwargs['stats'] = None will return None when popped
-maybe_stats = kwargs.get('stats', stats)
+maybe_stats = kwargs.pop('stats', stats)
if maybe_stats is not None:
stats = maybe_stats