hispark-modelzoo-fastspeech2 / model-card.json
shadow-cann's picture
Add files using upload-large-folder tool
100694b verified
{
"name": "FastSpeech2",
"id": "ie2sc9g1qk00",
"description": "FastSpeech2 是一种高效的端到端语音合成模型。相比 FastSpeech,FastSpeech2 引入了多尺度时长预测器和能量 / 基频预测分支,优化了时长预测模块并新增韵律特征建模,在合成速度和语音自然度上均有大幅提升。",
"category": "音频",
"framework": [
"PyTorch"
],
"supportOs": [
"OpenHarmony",
"Linux"
],
"computingPower": [
"Hi3403V100 SVP_NNN"
],
"tags": [
"文本转语音"
],
"repositoryUrl": "https://gitee.com/HiSpark/modelzoo/blob/master/samples/built-in/audio/FastSpeech2/README.md",
"licenseUrl": "https://github.com/ming024/FastSpeech2/blob/master/LICENSE",
"downloads": [
{
"fileName": "fastspeech_hifigan_en.onnx",
"variants": [
"源模型 / 源模型下载",
"源模型 / 源模型元数据",
"编译模型 / OM 元数据 / a16w8"
]
}
],
"apiDetail": {
"createdBy": 139318985286440,
"creationDate": "2026-01-08 16:18:57",
"creationUserCN": "sloanqin",
"lastUpdatedBy": null,
"lastUpdateDate": "2026-01-09 15:08:50",
"lastUpdateUserCN": "sloanqin",
"rowIdx": -1,
"id": "ie2sc9g1qk00",
"name": "FastSpeech2",
"isBeta": 1,
"betaVersionDesc": "CANN包版本需要适配修改待发布",
"description": "FastSpeech2 是一种高效的端到端语音合成模型。相比 FastSpeech,FastSpeech2 引入了多尺度时长预测器和能量 / 基频预测分支,优化了时长预测模块并新增韵律特征建模,在合成速度和语音自然度上均有大幅提升。",
"parentId": "ie2sc9g1qk00",
"coverImageId": 1722265270026243,
"coverImageUrl": "https://openxinhuo-board-image.obs.cn-east-3.myhuaweicloud.com/1722265270026243%2Ffastspeech2.jpg",
"modelEffectId": null,
"modelEffectUrl": "",
"computerVersion": [],
"naturalLanguageProcess": [],
"multimodal": [],
"video": [
"文本转语音"
],
"framework": [
"PyTorch"
],
"modelRepository": "https://gitee.com/HiSpark/modelzoo/blob/master/samples/built-in/audio/FastSpeech2/README.md",
"originModel": [
{
"id": "1722129101946883",
"name": "fastspeech_hifigan_en.onnx",
"url": null,
"size": "142724651"
}
],
"originModelLink": null,
"dataSet": "https://data.keithito.com/data/speech/LJSpeech-1.1.tar.bz2",
"modelLicense": "https://github.com/ming024/FastSpeech2/blob/master/LICENSE",
"detailParams": [
{
"name": "输入",
"value": "1x40"
},
{
"name": "参数量",
"value": "35.266M"
},
{
"name": "计算量",
"value": "29.162GFLOPs"
}
],
"quickStart": {
"url": "https://gitee.com/HiSpark/modelzoo/blob/master/samples/built-in/audio/FastSpeech2",
"markDownUrl": "",
"developLanguage": [
{
"language": "C++",
"context": "{\"ops\":[{\"attributes\":{\"line-height\":\"1.6\",\"color\":\"#40485b\",\"size\":\"16px\",\"background\":\"#ffffff\"},\"insert\":\"模型可以通过以下代码完成快速推理\"},{\"attributes\":{\"text-indent\":\"0px\"},\"insert\":\"\\n\"},{\"insert\":\"#include \\\"model.h\\\"\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"#include \\\"log.h\\\"\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\\n\"},{\"insert\":\"using namespace Infer;\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\\n\"},{\"insert\":\"int main()\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"{\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    EnvInit();\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    std::string omModelPath = \\\"/path/to/model.om\\\"; // 模型文件路径 \"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    std::string filePath= \\\"/path/to/file_list.json\\\"; // 输入文本文件路径\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    std::unique_ptr<Model> model = std::make_unique<Model>();\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    if (model->Load(omModelPath, ModelType::FastSpeech2) != 0) {\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        LOG(ERROR) << \\\"fail to load model\\\";\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        return -1;\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    }\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    auto ret = model->Infer(filePath, FileType::JsonFile);\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    if (ret.size() == 0) {\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        LOG(ERROR) << \\\"fail to infer model\\\";\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        model->Unload();\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        return -1;\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    }\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    if (model->Unload() != 0) {\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        LOG(ERROR) << \\\"fail to unload model\\\";\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"        return -1;\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    }\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    EnvDeinit();\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"    return 0;\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"insert\":\"}\"},{\"attributes\":{\"code-block\":\"plain\"},\"insert\":\"\\n\"},{\"attributes\":{\"line-height\":\"1.6\",\"color\":\"#40485b\",\"size\":\"16px\",\"background\":\"#ffffff\"},\"insert\":\"备注:上述C++代码依赖的动态库与头文件位于\"},{\"attributes\":{\"line-height\":\"1.6\",\"color\":\"#095eab\",\"size\":\"16px\",\"background\":\"transparent\",\"link\":\"https://gitee.com/HiSpark/modelzoo/tree/master/samples/common\"},\"insert\":\"/samples/common\"},{\"attributes\":{\"line-height\":\"1.6\",\"color\":\"#40485b\",\"size\":\"16px\",\"background\":\"#ffffff\"},\"insert\":\"目录下,编译相关配置参考\"},{\"attributes\":{\"line-height\":\"1.6\",\"color\":\"#095eab\",\"size\":\"16px\",\"background\":\"transparent\",\"link\":\"https://gitee.com/HiSpark/modelzoo/blob/master/samples/built-in/audio/FastSpeech2/src/CMakeLists.txt\"},\"insert\":\"CMakeLists.txt\"},{\"attributes\":{\"line-height\":\"1.6\",\"color\":\"#40485b\",\"size\":\"16px\",\"background\":\"#ffffff\"},\"insert\":\"。\"},{\"attributes\":{\"text-indent\":\"0px\"},\"insert\":\"\\n\"},{\"insert\":\"\\n\"}]}"
}
]
},
"status": "released",
"currentHandler": "",
"currentHandlerName": "",
"jsonPath": "https://gitee.com/sloanqin/modelzoo-dev/blob/fastspeech2/samples/built-in/audio/FastSpeech2/fastspeech2.json",
"modelAdaptor": [
{
"createdBy": null,
"creationDate": null,
"creationUserCN": null,
"lastUpdatedBy": null,
"lastUpdateDate": null,
"lastUpdateUserCN": null,
"rowIdx": -1,
"id": "i8ttm5k1tc00",
"name": "Hi3403V100 SVP_NNN",
"modelId": "ie2sc9g1qk00",
"modelName": "FastSpeech2",
"supportNames": [
"a16w8"
],
"toolkit": [
{
"name": "CANN配置",
"url": "",
"desc": "6.10.t01spc030b660;(请联系FAE获取)",
"imgId": "cann"
},
{
"name": "编译工具库",
"url": "https://gitee.com/HiSpark/pegasus/blob/Beta-v0.9.1/docs/Hi3403V100%E7%8E%AF%E5%A2%83%E6%90%AD%E5%BB%BA%E6%8C%87%E5%8D%97/Hi3403V100%E7%8E%AF%E5%A2%83%E6%90%AD%E5%BB%BA%E6%8C%87%E5%8D%97.md",
"desc": "高效编译,精准适配;AI性能优化,应用流畅运行",
"imgId": "tool"
},
{
"name": "SDK",
"url": "https://gitee.com/HiSpark/ss928v100_clang/tree/Beta-v0.9.1/",
"desc": "稳定、易用的设计;支撑客户快速产品量产",
"imgId": "sdk"
}
],
"supportOs": [
"OpenHarmony",
"Linux"
],
"supportQuantify": [
{
"createdBy": 132241120926760,
"creationDate": "2026-03-26 19:50:46",
"creationUserCN": "liaoshibin",
"lastUpdatedBy": 132241120926760,
"lastUpdateDate": "2026-03-26 19:50:46",
"lastUpdateUserCN": "liaoshibin",
"rowIdx": -1,
"id": "j6tf932ci000",
"name": "a16w8",
"computingId": "i8ttm5k1tc00",
"computingName": "Hi3403V100 SVP_NNN",
"omOfflineModelUrl": null,
"omOfflineModelId": 1722129460559875,
"omOfflineModelSize": "40041177",
"omOfflineModelName": "fastspeech_hifigan_en.om",
"omOfflineModel": [
{
"id": "1722129460559875",
"name": "fastspeech_hifigan_en.om",
"url": null,
"size": "40041177"
}
],
"omOfflineModelLink": null,
"releaseTime": "2026-01-11",
"boardOs": null,
"modelLicense": "https://gitee.com/HiSpark/modelzoo/blob/master/samples/built-in/audio/FastSpeech2/LICENSE",
"modelPerformance": [
{
"performanceValue": "52.49",
"unit": "耗时(ms)",
"desc": null
},
{
"performanceValue": "19.05",
"unit": "性能(fps)",
"desc": ""
},
{
"performanceValue": "488.799",
"unit": "单帧内存带宽(MB)",
"desc": ""
},
{
"performanceValue": "1.418",
"unit": "内存(MB)",
"desc": ""
}
],
"deleted": 0
}
],
"deleted": 0
}
],
"saveType": null,
"deleteType": null,
"latest": "Y",
"deleted": 0,
"modelPhase": "released",
"remark": null,
"fileInfo": null,
"reviewType": null,
"owner": "sloanqin",
"ownerBy": 139318985286440,
"optional": null,
"optionalList": [
"whalenowings",
"0e900d99dee8461b8"
],
"optionalBy": null,
"downloadNum": 23,
"collectNum": null,
"isCollect": null
}
}