| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
|
|
| #include "ms_mgau.h" |
|
|
| static ps_mgaufuncs_t ms_mgau_funcs = { |
| "ms", |
| ms_cont_mgau_frame_eval, |
| ms_mgau_mllr_transform, |
| ms_mgau_free |
| }; |
|
|
| ps_mgau_t * |
| ms_mgau_init(acmod_t *acmod, logmath_t *lmath, bin_mdef_t *mdef) |
| { |
| |
| ms_mgau_model_t *msg; |
| ps_mgau_t *mg; |
| gauden_t *g; |
| senone_t *s; |
| cmd_ln_t *config; |
| int i; |
|
|
| config = acmod->config; |
|
|
| msg = (ms_mgau_model_t *) ckd_calloc(1, sizeof(ms_mgau_model_t)); |
| msg->config = config; |
| msg->g = NULL; |
| msg->s = NULL; |
| |
| if ((g = msg->g = gauden_init(ps_config_str(config, "mean"), |
| ps_config_str(config, "var"), |
| ps_config_float(config, "varfloor"), |
| lmath)) == NULL) { |
| E_ERROR("Failed to read means and variances\n"); |
| goto error_out; |
| } |
|
|
| |
| if (g->n_feat != feat_dimension1(acmod->fcb)) { |
| E_ERROR("Number of streams does not match: %d != %d\n", |
| g->n_feat, feat_dimension1(acmod->fcb)); |
| goto error_out; |
| } |
| for (i = 0; i < g->n_feat; ++i) { |
| if ((uint32)g->featlen[i] != feat_dimension2(acmod->fcb, i)) { |
| E_ERROR("Dimension of stream %d does not match: %d != %d\n", i, |
| g->featlen[i], feat_dimension2(acmod->fcb, i)); |
| goto error_out; |
| } |
| } |
|
|
| s = msg->s = senone_init(msg->g, |
| ps_config_str(config, "mixw"), |
| ps_config_str(config, "senmgau"), |
| ps_config_float(config, "mixwfloor"), |
| lmath, mdef); |
|
|
| s->aw = ps_config_int(config, "aw"); |
|
|
| |
| if (s->n_feat != (uint32)g->n_feat) |
| E_FATAL("#Feature mismatch: gauden= %d, senone= %d\n", g->n_feat, |
| s->n_feat); |
| if (s->n_cw != (uint32)g->n_density) |
| E_FATAL("#Densities mismatch: gauden= %d, senone= %d\n", |
| g->n_density, s->n_cw); |
| if (s->n_gauden > (uint32)g->n_mgau) |
| E_FATAL("Senones need more codebooks (%d) than present (%d)\n", |
| s->n_gauden, g->n_mgau); |
| if (s->n_gauden < (uint32)g->n_mgau) |
| E_ERROR("Senones use fewer codebooks (%d) than present (%d)\n", |
| s->n_gauden, g->n_mgau); |
|
|
| msg->topn = ps_config_int(config, "topn"); |
| E_INFO("The value of topn: %d\n", msg->topn); |
| if (msg->topn == 0 || msg->topn > msg->g->n_density) { |
| E_WARN |
| ("-topn argument (%d) invalid or > #density codewords (%d); set to latter\n", |
| msg->topn, msg->g->n_density); |
| msg->topn = msg->g->n_density; |
| } |
|
|
| msg->dist = (gauden_dist_t ***) |
| ckd_calloc_3d(g->n_mgau, g->n_feat, msg->topn, |
| sizeof(gauden_dist_t)); |
| msg->mgau_active = ckd_calloc(g->n_mgau, sizeof(int8)); |
|
|
| mg = (ps_mgau_t *)msg; |
| mg->vt = &ms_mgau_funcs; |
| return mg; |
| error_out: |
| ms_mgau_free(ps_mgau_base(msg)); |
| return NULL; |
| } |
|
|
| void |
| ms_mgau_free(ps_mgau_t * mg) |
| { |
| ms_mgau_model_t *msg = (ms_mgau_model_t *)mg; |
| if (msg == NULL) |
| return; |
|
|
| if (msg->g) |
| gauden_free(msg->g); |
| if (msg->s) |
| senone_free(msg->s); |
| if (msg->dist) |
| ckd_free_3d((void *) msg->dist); |
| if (msg->mgau_active) |
| ckd_free(msg->mgau_active); |
| |
| ckd_free(msg); |
| } |
|
|
| int |
| ms_mgau_mllr_transform(ps_mgau_t *s, |
| ps_mllr_t *mllr) |
| { |
| ms_mgau_model_t *msg = (ms_mgau_model_t *)s; |
| return gauden_mllr_transform(msg->g, mllr, msg->config); |
| } |
|
|
| int32 |
| ms_cont_mgau_frame_eval(ps_mgau_t * mg, |
| int16 *senscr, |
| uint8 *senone_active, |
| int32 n_senone_active, |
| mfcc_t ** feat, |
| int32 frame, |
| int32 compallsen) |
| { |
| ms_mgau_model_t *msg = (ms_mgau_model_t *)mg; |
| int32 gid; |
| int32 topn; |
| int32 best; |
| gauden_t *g; |
| senone_t *sen; |
|
|
| (void)frame; |
| topn = ms_mgau_topn(msg); |
| g = ms_mgau_gauden(msg); |
| sen = ms_mgau_senone(msg); |
|
|
| if (compallsen) { |
| int32 s; |
|
|
| for (gid = 0; gid < g->n_mgau; gid++) |
| gauden_dist(g, gid, topn, feat, msg->dist[gid]); |
|
|
| best = MAX_INT32; |
| for (s = 0; (uint32)s < sen->n_sen; s++) { |
| senscr[s] = senone_eval(sen, s, msg->dist[sen->mgau[s]], topn); |
| if (best > senscr[s]) { |
| best = senscr[s]; |
| } |
| } |
|
|
| |
| for (s = 0; (uint32)s < sen->n_sen; s++) { |
| int32 bs = senscr[s] - best; |
| if (bs > 32767) |
| bs = 32767; |
| if (bs < -32768) |
| bs = -32768; |
| senscr[s] = bs; |
| } |
| } |
| else { |
| int32 i, n; |
| |
| for (gid = 0; gid < g->n_mgau; gid++) |
| msg->mgau_active[gid] = 0; |
|
|
| n = 0; |
| for (i = 0; i < n_senone_active; i++) { |
| |
| int32 s = senone_active[i] + n; |
| msg->mgau_active[sen->mgau[s]] = 1; |
| n = s; |
| } |
|
|
| |
| for (gid = 0; gid < g->n_mgau; gid++) { |
| if (msg->mgau_active[gid]) |
| gauden_dist(g, gid, topn, feat, msg->dist[gid]); |
| } |
|
|
| best = MAX_INT32; |
| n = 0; |
| for (i = 0; i < n_senone_active; i++) { |
| int32 s = senone_active[i] + n; |
| senscr[s] = senone_eval(sen, s, msg->dist[sen->mgau[s]], topn); |
| if (best > senscr[s]) { |
| best = senscr[s]; |
| } |
| n = s; |
| } |
|
|
| |
| n = 0; |
| for (i = 0; i < n_senone_active; i++) { |
| int32 s = senone_active[i] + n; |
| int32 bs = senscr[s] - best; |
| if (bs > 32767) |
| bs = 32767; |
| if (bs < -32768) |
| bs = -32768; |
| senscr[s] = bs; |
| n = s; |
| } |
| } |
|
|
| return 0; |
| } |
|
|