ESPnet
multilingual
audio
universa
ftshijt's picture
Update model
21a6355
srmr
language
nisqa_mos_pred
nisqa_noi_pred
nisqa_dis_pred
nisqa_col_pred
nisqa_loud_pred
sheet_ssqa
utmos
utmosv2
dns_overall
dns_p808
plcmos
singmos
scoreq_nr
se_sdr
se_sar
se_si_snr
se_ci_sdr
pam_score
speaking_rate
audiobox_aesthetics_CE
audiobox_aesthetics_CU
audiobox_aesthetics_PC
audiobox_aesthetics_PQ
asvspoof_score
real_language
qwen_speaker_count
qwen_speaker_gender
qwen_speaker_age
qwen_speech_impairment
qwen_voice_pitch
qwen_pitch_range
qwen_voice_type
qwen_speech_volume_level
qwen_language
qwen_speech_register
qwen_vocabulary_complexity
qwen_speech_purpose
qwen_speech_emotion
qwen_speech_clarity
qwen_speech_rate
qwen_speaking_style
qwen_laughter_crying
qwen_speech_background_environment
qwen_recording_quality
qwen_channel_type
snr_simulation
rir_room_size
nomad
emotion_similarity
noresqa_score
speech_bert
speech_bleu
speech_token_distance
scoreq_ref
asr_match_error_rate
ref_text_length
pred_text_length
spk_similarity
rt60
visqol
pysepm_fwsegsnr
pysepm_llr
pysepm_wss
pysepm_cd
pysepm_c_sig
pysepm_c_bak
pysepm_c_ovl
pysepm_csii_high
pysepm_csii_mid
pysepm_csii_low
pysepm_ncm
mcd
f0rmse
f0corr
pesq
stoi
sdr
sar
si_snr
ci_sdr
nisqa_real_mos
wer
cer
urgent_mos
voicemos_real_mos