For the HF checkpoints, I removed the optimizer state to save space; initializing Adam without the saved first/second moments is OK.
This commit is contained in:
@@ -179,7 +179,7 @@ scaler = torch.cuda.amp.GradScaler(enabled=(dtype == "float16"))
|
||||
|
||||
# optimizer
|
||||
optimizer = model.configure_optimizers(weight_decay, learning_rate, (beta1, beta2), device_type)
|
||||
if init_from == "resume":
|
||||
if init_from == "resume" and "optimizer" in checkpoint:
|
||||
optimizer.load_state_dict(checkpoint["optimizer"])
|
||||
checkpoint = None # free up memory
|
||||
|
||||
|
||||
Reference in New Issue
Block a user