{ "name": "FastSpeech2", "id": "ie2sc9g1qk00", "description": "FastSpeech2 是一种高效的端到端语音合成模型。相比 FastSpeech,FastSpeech2 引入了多尺度时长预测器和能量 / 基频预测分支,优化了时长预测模块并新增韵律特征建模,在合成速度和语音自然度上均有大幅提升。", "category": "音频", "framework": [ "PyTorch" ], "supportOs": [ "OpenHarmony", "Linux" ], "computingPower": [ "Hi3403V100 SVP_NNN" ], "tags": [ "文本转语音" ], "repositoryUrl": "https://gitee.com/HiSpark/modelzoo/blob/master/samples/built-in/audio/FastSpeech2/README.md", "licenseUrl": "https://github.com/ming024/FastSpeech2/blob/master/LICENSE", "downloads": [ { "fileName": "fastspeech_hifigan_en.onnx", "variants": [ "源模型 / 源模型下载", "源模型 / 源模型元数据", "编译模型 / OM 元数据 / a16w8" ] } ], "apiDetail": { "createdBy": 139318985286440, "creationDate": "2026-01-08 16:18:57", "creationUserCN": "sloanqin", "lastUpdatedBy": null, "lastUpdateDate": "2026-01-09 15:08:50", "lastUpdateUserCN": "sloanqin", "rowIdx": -1, "id": "ie2sc9g1qk00", "name": "FastSpeech2", "isBeta": 1, "betaVersionDesc": "CANN包版本需要适配修改待发布", "description": "FastSpeech2 是一种高效的端到端语音合成模型。相比 FastSpeech,FastSpeech2 引入了多尺度时长预测器和能量 / 基频预测分支,优化了时长预测模块并新增韵律特征建模,在合成速度和语音自然度上均有大幅提升。", "parentId": "ie2sc9g1qk00", "coverImageId": 1722265270026243, "coverImageUrl": "https://openxinhuo-board-image.obs.cn-east-3.myhuaweicloud.com/1722265270026243%2Ffastspeech2.jpg", "modelEffectId": null, "modelEffectUrl": "", "computerVersion": [], "naturalLanguageProcess": [], "multimodal": [], "video": [ "文本转语音" ], "framework": [ "PyTorch" ], "modelRepository": "https://gitee.com/HiSpark/modelzoo/blob/master/samples/built-in/audio/FastSpeech2/README.md", "originModel": [ { "id": "1722129101946883", "name": "fastspeech_hifigan_en.onnx", "url": null, "size": "142724651" } ], "originModelLink": null, "dataSet": "https://data.keithito.com/data/speech/LJSpeech-1.1.tar.bz2", "modelLicense": "https://github.com/ming024/FastSpeech2/blob/master/LICENSE", "detailParams": [ { "name": "输入", "value": "1x40" }, { "name": "参数量", "value": "35.266M" }, { "name": "计算量", "value": "29.162GFLOPs" } ], "quickStart": { "url": "https://gitee.com/HiSpark/modelzoo/blob/master/samples/built-in/audio/FastSpeech2", "markDownUrl": "", "developLanguage": [ { "language": "C++", "context": "{\"ops\":[{\"attributes\":{\"line-height\":\"1.6\",\"color\":\"#40485b\",\"size\":\"16px\",\"background\":\"#ffffff\"},\"insert\":\"模型可以通过以下代码完成快速推理\"},{\"attributes\":{\"text-indent\":\"0px\"},\"insert\":\"\\n\"},{\"insert\":\"#include \\\"model.h\\\"\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"#include \\\"log.h\\\"\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\\n\"},{\"insert\":\"using namespace Infer;\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\\n\"},{\"insert\":\"int main()\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"{\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    EnvInit();\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    std::string omModelPath = \\\"/path/to/model.om\\\"; // 模型文件路径 \"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    std::string filePath= \\\"/path/to/file_list.json\\\"; // 输入文本文件路径\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    std::unique_ptr model = std::make_unique();\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    if (model->Load(omModelPath, ModelType::FastSpeech2) != 0) {\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        LOG(ERROR) << \\\"fail to load model\\\";\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        return -1;\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    }\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    auto ret = model->Infer(filePath, FileType::JsonFile);\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    if (ret.size() == 0) {\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        LOG(ERROR) << \\\"fail to infer model\\\";\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        model->Unload();\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        return -1;\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    }\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    if (model->Unload() != 0) {\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        LOG(ERROR) << \\\"fail to unload model\\\";\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        return -1;\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    }\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    EnvDeinit();\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    return 0;\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"}\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"attributes\":{\"line-height\":\"1.6\",\"color\":\"#40485b\",\"size\":\"16px\",\"background\":\"#ffffff\"},\"insert\":\"备注:上述C++代码依赖的动态库与头文件位于\"},{\"attributes\":{\"line-height\":\"1.6\",\"color\":\"#095eab\",\"size\":\"16px\",\"background\":\"transparent\",\"link\":\"https://gitee.com/HiSpark/modelzoo/tree/master/samples/common\"},\"insert\":\"/samples/common\"},{\"attributes\":{\"line-height\":\"1.6\",\"color\":\"#40485b\",\"size\":\"16px\",\"background\":\"#ffffff\"},\"insert\":\"目录下,编译相关配置参考\"},{\"attributes\":{\"line-height\":\"1.6\",\"color\":\"#095eab\",\"size\":\"16px\",\"background\":\"transparent\",\"link\":\"https://gitee.com/HiSpark/modelzoo/blob/master/samples/built-in/audio/FastSpeech2/src/CMakeLists.txt\"},\"insert\":\"CMakeLists.txt\"},{\"attributes\":{\"line-height\":\"1.6\",\"color\":\"#40485b\",\"size\":\"16px\",\"background\":\"#ffffff\"},\"insert\":\"。\"},{\"attributes\":{\"text-indent\":\"0px\"},\"insert\":\"\\n\"},{\"insert\":\"\\n\"}]}" } ] }, "status": "released", "currentHandler": "", "currentHandlerName": "", "jsonPath": "https://gitee.com/sloanqin/modelzoo-dev/blob/fastspeech2/samples/built-in/audio/FastSpeech2/fastspeech2.json", "modelAdaptor": [ { "createdBy": null, "creationDate": null, "creationUserCN": null, "lastUpdatedBy": null, "lastUpdateDate": null, "lastUpdateUserCN": null, "rowIdx": -1, "id": "i8ttm5k1tc00", "name": "Hi3403V100 SVP_NNN", "modelId": "ie2sc9g1qk00", "modelName": "FastSpeech2", "supportNames": [ "a16w8" ], "toolkit": [ { "name": "CANN配置", "url": "", "desc": "6.10.t01spc030b660;(请联系FAE获取)", "imgId": "cann" }, { "name": "编译工具库", "url": "https://gitee.com/HiSpark/pegasus/blob/Beta-v0.9.1/docs/Hi3403V100%E7%8E%AF%E5%A2%83%E6%90%AD%E5%BB%BA%E6%8C%87%E5%8D%97/Hi3403V100%E7%8E%AF%E5%A2%83%E6%90%AD%E5%BB%BA%E6%8C%87%E5%8D%97.md", "desc": "高效编译,精准适配;AI性能优化,应用流畅运行", "imgId": "tool" }, { "name": "SDK", "url": "https://gitee.com/HiSpark/ss928v100_clang/tree/Beta-v0.9.1/", "desc": "稳定、易用的设计;支撑客户快速产品量产", "imgId": "sdk" } ], "supportOs": [ "OpenHarmony", "Linux" ], "supportQuantify": [ { "createdBy": 132241120926760, "creationDate": "2026-03-26 19:50:46", "creationUserCN": "liaoshibin", "lastUpdatedBy": 132241120926760, "lastUpdateDate": "2026-03-26 19:50:46", "lastUpdateUserCN": "liaoshibin", "rowIdx": -1, "id": "j6tf932ci000", "name": "a16w8", "computingId": "i8ttm5k1tc00", "computingName": "Hi3403V100 SVP_NNN", "omOfflineModelUrl": null, "omOfflineModelId": 1722129460559875, "omOfflineModelSize": "40041177", "omOfflineModelName": "fastspeech_hifigan_en.om", "omOfflineModel": [ { "id": "1722129460559875", "name": "fastspeech_hifigan_en.om", "url": null, "size": "40041177" } ], "omOfflineModelLink": null, "releaseTime": "2026-01-11", "boardOs": null, "modelLicense": "https://gitee.com/HiSpark/modelzoo/blob/master/samples/built-in/audio/FastSpeech2/LICENSE", "modelPerformance": [ { "performanceValue": "52.49", "unit": "耗时(ms)", "desc": null }, { "performanceValue": "19.05", "unit": "性能(fps)", "desc": "" }, { "performanceValue": "488.799", "unit": "单帧内存带宽(MB)", "desc": "" }, { "performanceValue": "1.418", "unit": "内存(MB)", "desc": "" } ], "deleted": 0 } ], "deleted": 0 } ], "saveType": null, "deleteType": null, "latest": "Y", "deleted": 0, "modelPhase": "released", "remark": null, "fileInfo": null, "reviewType": null, "owner": "sloanqin", "ownerBy": 139318985286440, "optional": null, "optionalList": [ "whalenowings", "0e900d99dee8461b8" ], "optionalBy": null, "downloadNum": 23, "collectNum": null, "isCollect": null } }