from transformers import Dinov2Model


def build_vision_encoder(config) -> Dinov2Model:
    """Build the vision encoder selected by ``config.model_type``.

    Only ``"dinov2"`` is currently handled; for it, the encoder is created via
    ``Dinov2Model.from_pretrained(config.pretrained_name_or_path)``.

    Args:
        config: Object exposing a ``model_type`` attribute and, for the
            ``"dinov2"`` case, a ``pretrained_name_or_path`` attribute that
            is forwarded unchanged to ``from_pretrained``.

    Returns:
        The model instance returned by ``Dinov2Model.from_pretrained``.

    Raises:
        NotImplementedError: If ``config.model_type`` is anything other than
            ``"dinov2"``.
    """
    # Reject unknown encoder types up front and name the offending value so a
    # misconfiguration is diagnosable directly from the traceback.
    if config.model_type != "dinov2":
        raise NotImplementedError(
            f"Unsupported vision encoder model_type: {config.model_type!r}"
        )

    return Dinov2Model.from_pretrained(config.pretrained_name_or_path)