Audio Classification
Transformers
Safetensors
Chinese
qwen2_audio
text2text-generation
File size: 804 Bytes
9fd670d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
{
  "_name_or_path": "/mnt/dolphinfs/hdd_pool/docker/user/hadoop-aipnlp/EVA/lishuailin/qwen-audio-sft/Qwen2-Audio-7B-Instruct",
  "architectures": [
    "Qwen2AudioForConditionalGeneration"
  ],
  "audio_config": {
    "model_type": "qwen2_audio_encoder"
  },
  "audio_token_index": 151646,
  "hidden_size": 4096,
  "ignore_index": -100,
  "keys_to_ignore_at_inference": [
    "past_key_values"
  ],
  "model_type": "qwen2_audio",
  "text_config": {
    "bos_token_id": 151643,
    "eos_token_id": 151645,
    "intermediate_size": 11008,
    "max_position_embeddings": 8192,
    "model_type": "qwen2",
    "rms_norm_eps": 1e-05,
    "torch_dtype": "bfloat16",
    "use_mrope": false,
    "vocab_size": 156032
  },
  "torch_dtype": "bfloat16",
  "transformers_version": "4.46.3",
  "vocab_size": 156032
}