Fix AIMv2 checkpoint/config compatibility with custom HF code

This PR makes the uploaded checkpoint consistent with the custom `modeling_aimv2.py` implementation shipped in the repository.

- remap tensor names in `model.safetensors` to match `AIMv2Model.state_dict()`
- update `config.json` so `architectures` and `model_type` align with the shipped config/model classes

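Without these changes, the checkpoint's tensor names and the config's `architectures`/`model_type` do not match the shipped custom classes, so loading via `AutoModel.from_pretrained(..., trust_remote_code=True)` initializes most model weights from scratch instead of loading the published checkpoint.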

Files changed (2)

config.json +2 -2
model.safetensors +2 -2

config.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "architectures": [
-    "Aimv2VisionModel"
   ],
   "attention_dropout": 0.0,
   "auto_map": {
@@ -15,7 +15,7 @@
   "intermediate_size": 2816,
   "is_native": false,
   "mlp_bias": false,
-  "model_type": "aimv2_vision_model",
   "num_attention_heads": 8,
   "num_channels": 3,
   "num_hidden_layers": 24,

@@ -1,6 +1,6 @@
 {
   "architectures": [
+    "AIMv2Model"
   ],
   "attention_dropout": 0.0,
   "auto_map": {
@@ -15,7 +15,7 @@
   "intermediate_size": 2816,
   "is_native": false,
   "mlp_bias": false,
+  "model_type": "aimv2",
   "num_attention_heads": 8,
   "num_channels": 3,
   "num_hidden_layers": 24,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7d28174ebb3d01b21053827e27e8e9e59960f0ef2907298b977a1da56f9e3982
-size 1236816248

 version https://git-lfs.github.com/spec/v1
+oid sha256:2d467ee5b52efcfed8bc18fe10e63879d049a03ed9adbd2529a4657f32355ff2
+size 1236809360