|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from nemo.lightning.pytorch.optim.base import LRSchedulerModule, OptimizerModule |
|
|
from nemo.lightning.pytorch.optim.lr_scheduler import ( |
|
|
CosineAnnealingScheduler, |
|
|
InverseSquareRootAnnealingScheduler, |
|
|
NoamAnnealingScheduler, |
|
|
NoamHoldAnnealingScheduler, |
|
|
PolynomialDecayAnnealingScheduler, |
|
|
PolynomialHoldDecayAnnealingScheduler, |
|
|
SquareAnnealingScheduler, |
|
|
SquareRootAnnealingScheduler, |
|
|
T5InverseSquareRootAnnealingScheduler, |
|
|
WarmupAnnealingScheduler, |
|
|
WarmupHoldPolicyScheduler, |
|
|
WarmupPolicyScheduler, |
|
|
) |
|
|
from nemo.lightning.pytorch.optim.megatron import MegatronOptimizerModule |
|
|
from nemo.lightning.pytorch.optim.pytorch import PytorchOptimizerModule |
|
|
|
|
|
__all__ = [ |
|
|
"OptimizerModule", |
|
|
"LRSchedulerModule", |
|
|
"MegatronOptimizerModule", |
|
|
"WarmupPolicyScheduler", |
|
|
"WarmupHoldPolicyScheduler", |
|
|
"SquareAnnealingScheduler", |
|
|
"SquareRootAnnealingScheduler", |
|
|
"NoamAnnealingScheduler", |
|
|
"NoamHoldAnnealingScheduler", |
|
|
"WarmupAnnealingScheduler", |
|
|
"InverseSquareRootAnnealingScheduler", |
|
|
"T5InverseSquareRootAnnealingScheduler", |
|
|
"PolynomialDecayAnnealingScheduler", |
|
|
"PolynomialHoldDecayAnnealingScheduler", |
|
|
"CosineAnnealingScheduler", |
|
|
"PytorchOptimizerModule", |
|
|
] |
|
|
|