{
  "quantization_method": "bitsandbytes",
  "bits": 8,
  "quant_type": "int8",
  "double_quant": false,
  "modules_not_quantized": [
    "acoustic_tokenizer_encoder",
    "semantic_tokenizer_encoder",
    "acoustic_projection",
    "semantic_projection",
    "lm_head"
  ],
  "modules_quantized": [
    "language_model (excluding lm_head)"
  ],
  "base_model": "microsoft/VibeVoice-ASR-HF",
  "transformers_version": "5.3.0"
}