Skip to content
Snippets Groups Projects

Support subword and word language models

Merged Solene Tarride requested to merge subword-and-word-lm into main
All threads resolved!
Compare and Show latest version
8 files
+ 196
- 133
Compare changes
  • Side-by-side
  • Inline
Files
8
@@ -224,6 +224,8 @@ class GenericTrainingManager:
self.best = checkpoint["best"]
if "scaler_state_dict" in checkpoint:
self.scaler.load_state_dict(checkpoint["scaler_state_dict"])
if "dropout_scheduler_step" in checkpoint:
self.dropout_scheduler.resume(checkpoint["dropout_scheduler_step"])
# Load model weights from past training
for model_name in self.models:
# Transform to DDP/from DDP model
@@ -412,6 +414,7 @@ class GenericTrainingManager:
"scaler_state_dict": self.scaler.state_dict(),
"best": self.best,
"charset": self.dataset.charset,
"dropout_scheduler_step": self.dropout_scheduler.step_num,
}
for model_name in self.optimizers:
Loading