|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from hydra.core.config_store import ConfigStore |
|
|
|
|
|
from cosmos_predict1.diffusion.networks.general_dit_video_conditioned import VideoExtendGeneralDIT |
|
|
from cosmos_predict1.utils.lazy_config import LazyCall as L |
|
|
from cosmos_predict1.utils.lazy_config import LazyDict |
|
|
|
|
|
# Experiment configuration for the job named "GEN3C_Cosmos_7B" (group "Gen3c").
# The defaults list overrides the `net`, `conditioner` and `tokenizer` config
# groups; "_self_" is listed last so the values set in this node are composed
# after those overrides.
GEN3C_Cosmos_7B: LazyDict = LazyDict(
    {
        "defaults": [
            {"override /net": "faditv2_7b"},
            {"override /conditioner": "video_cond"},
            {"override /tokenizer": "cosmos_diffusion_tokenizer_res720_comp8x8x8_t121_ver092624"},
            "_self_",
        ],
        "model": {
            # NOTE(review): axis order is not visible here — presumably
            # (channels, frames, height, width); confirm against the model.
            "latent_shape": [16, 16, 88, 160],
            "conditioner": {"video_cond_bool": {}},
            "net": L(VideoExtendGeneralDIT)(
                rope_h_extrapolation_ratio=1.0,
                rope_w_extrapolation_ratio=1.0,
                rope_t_extrapolation_ratio=2.0,
                # Evaluates to 81. NOTE(review): the terms look like 16 latent
                # channels + 16 * 4 conditioning channels (likely tied to
                # frame_buffer_max=2 below) + 1 mask channel — confirm with
                # the network definition before changing either value.
                in_channels=16 + 16 * 4 + 1,
            ),
            "frame_buffer_max": 2,
        },
        "job": {"group": "Gen3c", "name": "GEN3C_Cosmos_7B"},
    }
)
|
|
|
|
|
# Register each experiment config from this module in Hydra's ConfigStore.
# Every entry is stored in the "experiment" group with the "_global_" package,
# under the name taken from its own job.name field.
cs = ConfigStore.instance()
for _item in (GEN3C_Cosmos_7B,):
    cs.store(
        group="experiment",
        package="_global_",
        name=_item["job"]["name"],
        node=_item,
    )
|
|
|