For the HF checkpoints I removed the optimizer state to save space; initializing Adam without the first/second moments is OK.
This commit is contained in:
@@ -179,7 +179,7 @@ scaler = torch.cuda.amp.GradScaler(enabled=(dtype == "float16"))
|
|||||||
|
|
||||||
# optimizer
|
# optimizer
|
||||||
optimizer = model.configure_optimizers(weight_decay, learning_rate, (beta1, beta2), device_type)
|
optimizer = model.configure_optimizers(weight_decay, learning_rate, (beta1, beta2), device_type)
|
||||||
if init_from == "resume":
|
if init_from == "resume" and "optimizer" in checkpoint:
|
||||||
optimizer.load_state_dict(checkpoint["optimizer"])
|
optimizer.load_state_dict(checkpoint["optimizer"])
|
||||||
checkpoint = None # free up memory
|
checkpoint = None # free up memory
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user