|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from cosmos_predict1.diffusion.training.functional.lr_scheduler import LambdaLinearScheduler |
|
|
from cosmos_predict1.diffusion.training.utils.optim_instantiate import get_base_optimizer |
|
|
from cosmos_predict1.utils.lazy_config import PLACEHOLDER |
|
|
from cosmos_predict1.utils.lazy_config import LazyCall as L |
|
|
from cosmos_predict1.utils.lazy_config import LazyDict |
|
|
|
|
|
# Lazy (deferred) call to `get_base_optimizer` with the default optimizer
# hyper-parameters. Nothing is constructed here; the call is only recorded.
FusedAdamWConfig: LazyDict = L(get_base_optimizer)(
    # Left as PLACEHOLDER here — presumably replaced with the real model
    # before the config is instantiated (confirm against the caller).
    model=PLACEHOLDER,
    # Core hyper-parameters.
    lr=1e-4,
    weight_decay=0.3,
    betas=[0.9, 0.999],
    # Optimizer implementation selector passed through to `get_base_optimizer`.
    optim_type="fusedadam",
    eps=1e-8,
    # Implementation switches forwarded as-is; their exact semantics are
    # defined by `get_base_optimizer` / the underlying optimizer.
    sharding=False,
    master_weights=True,
    capturable=True,
)
|
|
|
|
|
# Lazy (deferred) call to `LambdaLinearScheduler` with the default schedule.
# Every argument is a one-element list.
# NOTE(review): f_min == f_max == 1.0, so the multiplier presumably ramps from
# f_start during warm-up and then stays flat — confirm against the
# LambdaLinearScheduler implementation.
LambdaLinearSchedulerConfig: LazyDict = L(LambdaLinearScheduler)(
    warm_up_steps=[1000],
    cycle_lengths=[10_000_000_000_000],  # same value as 10000000000000
    f_start=[1e-6],
    f_max=[1.0],
    f_min=[1.0],
)
|
|
|