|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from hydra.core.config_store import ConfigStore |
|
|
|
|
|
from cosmos_predict1.diffusion.networks.general_dit_video_conditioned_multiview import MultiviewVideoExtendGeneralDIT |
|
|
from cosmos_predict1.utils.lazy_config import LazyCall as L |
|
|
from cosmos_predict1.utils.lazy_config import LazyDict |
|
|
|
|
|
# Experiment config for the 7B multiview Video2World model.
#
# It is layered on top of the Text2World multiview experiment through the
# Hydra defaults list, swaps the conditioner config group to
# "video_cond_frame_repeat", and replaces the network with a lazily
# constructed MultiviewVideoExtendGeneralDIT.
Cosmos_Predict1_Video2World_7B_Multiview: LazyDict = LazyDict(
    {
        "defaults": [
            # Base experiment whose settings are inherited.
            "/experiment/Cosmos_Predict1_Text2World_7B_Multiview",
            # Select a different option for the conditioner config group.
            {"override /conditioner": "video_cond_frame_repeat"},
            # Listed last so the values in this dict are merged after the
            # entries above.
            "_self_",
        ],
        "job": {
            # NOTE(review): the group is "Text2World" although this is a
            # Video2World experiment -- confirm this is intentional.
            "group": "Text2World",
            "name": "Cosmos_Predict1_Video2World_7B_Multiview",
        },
        "model": {
            # Presumably ordered as (channels, frames, height, width) in
            # latent space -- TODO confirm against the model code.
            "latent_shape": [16, 16, 88, 160],
            # LazyCall: records the target class and keyword arguments here.
            "net": L(MultiviewVideoExtendGeneralDIT)(
                n_views=6,
                view_condition_dim=6,
                add_repeat_frame_embedding=True,
            ),
            # Empty `video_cond_bool` entry; presumably its fields come from
            # the selected conditioner group -- verify.
            "conditioner": {"video_cond_bool": {}},
        },
    }
)
|
|
|
|
|
|
|
|
# Register the experiment with Hydra's ConfigStore under the "experiment"
# group. The entry is keyed by the config's own job name and uses the
# "_global_" package.
cs = ConfigStore.instance()
cs.store(
    name=Cosmos_Predict1_Video2World_7B_Multiview["job"]["name"],
    node=Cosmos_Predict1_Video2World_7B_Multiview,
    group="experiment",
    package="_global_",
)
|
|
|