File size: 344 Bytes
3e270dc
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
{
  "model_type": "ValueModel",
  "base_model": "Qwen/Qwen2.5-Math-1.5B-Instruct",
  "value_head": {
    "file": "value_head.safetensors",
    "shape": [
      1,
      1536
    ],
    "dtype": "torch.bfloat16"
  },
  "inference_note": "Load base model via transformers; load value_head.safetensors separately and apply on last_hidden_state."
}