|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from enum import Enum |
|
|
|
|
|
from cosmos_predict1.tokenizer.networks.configs import continuous_image_8x8_360p as continuous_image_8x8_360p_dict |
|
|
from cosmos_predict1.tokenizer.networks.configs import continuous_image_16x16_360p as continuous_image_16x16_360p_dict |
|
|
from cosmos_predict1.tokenizer.networks.configs import continuous_video_4x8x8_360p as continuous_video_4x8x8_360p_dict |
|
|
from cosmos_predict1.tokenizer.networks.configs import continuous_video_8x8x8_720p as continuous_video_8x8x8_720p_dict |
|
|
from cosmos_predict1.tokenizer.networks.configs import discrete_image_8x8_360p as discrete_image_8x8_360p_dict |
|
|
from cosmos_predict1.tokenizer.networks.configs import discrete_image_16x16_360p as discrete_image_16x16_360p_dict |
|
|
from cosmos_predict1.tokenizer.networks.configs import discrete_video_4x8x8_360p as discrete_video_4x8x8_360p_dict |
|
|
from cosmos_predict1.tokenizer.networks.configs import discrete_video_8x16x16_720p as discrete_video_8x16x16_720p_dict |
|
|
from cosmos_predict1.tokenizer.networks.continuous_image import ContinuousImageTokenizer |
|
|
from cosmos_predict1.tokenizer.networks.continuous_video import CausalContinuousVideoTokenizer |
|
|
from cosmos_predict1.tokenizer.networks.discrete_image import DiscreteImageTokenizer |
|
|
from cosmos_predict1.tokenizer.networks.discrete_video import CausalDiscreteVideoTokenizer |
|
|
|
|
|
|
|
|
class TokenizerConfigs(Enum):
    """Registry of the tokenizer network configurations imported by this module.

    Each member's ``value`` is the config object imported from
    ``cosmos_predict1.tokenizer.networks.configs`` (presumably a dict, going
    by the ``*_dict`` import aliases -- confirm against that module).

    Member names start with a two-letter family prefix (CI, DI, CV, DV),
    followed by what looks like the compression factors and the resolution
    the config was built for (e.g. ``CV4x8x8_360p``) -- confirm.

    NOTE(review): ``Enum`` turns members whose values compare equal into
    aliases of the first one; this layout assumes all imported configs are
    distinct -- confirm.
    """

    # Continuous Image (CI) Tokenizer Configs
    CI8x8_360p = continuous_image_8x8_360p_dict
    CI16x16_360p = continuous_image_16x16_360p_dict

    # Discrete Image (DI) Tokenizer Configs
    DI8x8_360p = discrete_image_8x8_360p_dict
    DI16x16_360p = discrete_image_16x16_360p_dict

    # Causal Continuous Video (CV) Tokenizer Configs
    CV8x8x8_720p = continuous_video_8x8x8_720p_dict
    CV4x8x8_360p = continuous_video_4x8x8_360p_dict

    # Causal Discrete Video (DV) Tokenizer Configs
    DV8x16x16_720p = discrete_video_8x16x16_720p_dict
    DV4x8x8_360p = discrete_video_4x8x8_360p_dict
|
|
|
|
|
|
|
|
class TokenizerModels(Enum):
    """Map each tokenizer family code to the class that implements it.

    The member names (CI, DI, CV, DV) are the same two-letter prefixes used
    by the member names of ``TokenizerConfigs``. A member's ``value`` is the
    tokenizer class itself, not an instance.
    """

    # Continuous image tokenizer.
    CI = ContinuousImageTokenizer
    # Discrete image tokenizer.
    DI = DiscreteImageTokenizer
    # Causal continuous video tokenizer.
    CV = CausalContinuousVideoTokenizer
    # Causal discrete video tokenizer.
    DV = CausalDiscreteVideoTokenizer
|
|
|