|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from hydra.core.config_store import ConfigStore |
|
|
|
|
|
from cosmos_predict1.utils.lazy_config import LazyCall as L |
|
|
from cosmos_predict1.utils.lazy_config import LazyDict |
|
|
|
|
|
# Experiment configuration for the multiview variant of the 7B Text2World model.
#
# The "defaults" list starts from the "/experiment/Cosmos_Predict1_Text2World_7B"
# entry and overrides the "/net" and "/conditioner" groups; "_self_" is listed
# last, so (per Hydra's defaults-list rules) the values set below are expected
# to take precedence over the inherited ones.
# NOTE(review): the meaning of the individual `latent_shape` entries and the
# unit of `pixel_chunk_duration` are not visible in this file -- confirm
# against the model/tokenizer definitions before changing them.
Cosmos_Predict1_Text2World_7B_Multiview: LazyDict = LazyDict(
    {
        "defaults": [
            "/experiment/Cosmos_Predict1_Text2World_7B",
            {"override /net": "faditv2_multiview_7b"},
            {"override /conditioner": "add_fps_image_size_padding_mask_frame_repeat"},
            "_self_",
        ],
        # Job identity; the "name" entry is reused as the ConfigStore key.
        "job": {
            "group": "Text2World",
            "name": "Cosmos_Predict1_Text2World_7B_Multiview",
        },
        # Model-level settings specified by this experiment.
        "model": {
            "latent_shape": [16, 16, 88, 160],
            "tokenizer": {
                "video_vae": {
                    "pixel_chunk_duration": 57,
                },
            },
        },
    }
)
|
|
|
|
|
|
|
|
# Register the experiment with Hydra's ConfigStore at import time. The node is
# stored in the "experiment" group with the "_global_" package, keyed by the
# job name declared inside the config itself.
cs = ConfigStore.instance()
cs.store(
    node=Cosmos_Predict1_Text2World_7B_Multiview,
    name=Cosmos_Predict1_Text2World_7B_Multiview["job"]["name"],
    package="_global_",
    group="experiment",
)
|
|
|