OpenMOSS-Team
/

MOSS-VL-Base-0408

Video-Text-to-Text

feature-extraction

Video-Understanding

Image-Understanding

vision-language

Model card Files Files and versions

CCCCyx committed on Apr 23

Commit

fe6fdd6

·

verified ·

1 Parent(s): caf6173

Update modeling_moss_vl.py

Files changed (1) hide show

modeling_moss_vl.py +5 -1

modeling_moss_vl.py CHANGED Viewed

@@ -2094,7 +2094,11 @@ class MossVLModel(MossVLPreTrainedModel):
     """
 )
 class MossVLForConditionalGeneration(MossVLPreTrainedModel, GenerationMixin):
-    _tied_weights_keys = ["lm_head.weight"]
     config: MossVLConfig
     _checkpoint_conversion_mapping = {}
     accepts_loss_kwargs = False

     """
 )
 class MossVLForConditionalGeneration(MossVLPreTrainedModel, GenerationMixin):
+    # transformers 5.x expects a dict[target, source]; MossVL does not tie
+    # lm_head to the embeddings (config.tie_word_embeddings is False), so the
+    # mapping is empty. The legacy list format ["lm_head.weight"] breaks
+    # save_pretrained in transformers>=5.
+    _tied_weights_keys: dict[str, str] = {}
     config: MossVLConfig
     _checkpoint_conversion_mapping = {}
     accepts_loss_kwargs = False