ESPnet
multilingual
audio
universa
ftshijt's picture
Update model
46b48bd
asr_match_error_rate
asvspoof_score
audiobox_aesthetics_CE
audiobox_aesthetics_CU
audiobox_aesthetics_PC
audiobox_aesthetics_PQ
cer
ci_sdr
dns_overall
dns_p808
emotion_similarity
f0corr
f0rmse
language
mcd
nisqa_col_pred
nisqa_dis_pred
nisqa_loud_pred
nisqa_mos_pred
nisqa_noi_pred
nisqa_real_mos
nomad
noresqa_score
pam_score
pesq
plcmos
pred_text_length
pysepm_c_bak
pysepm_cd
pysepm_c_ovl
pysepm_c_sig
pysepm_csii_high
pysepm_csii_low
pysepm_csii_mid
pysepm_fwsegsnr
pysepm_llr
pysepm_ncm
pysepm_wss
qwen_channel_type
qwen_language
qwen_laughter_crying
qwen_pitch_range
qwen_recording_quality
qwen_speaker_age
qwen_speaker_count
qwen_speaker_gender
qwen_speaking_style
qwen_speech_background_environment
qwen_speech_clarity
qwen_speech_emotion
qwen_speech_impairment
qwen_speech_purpose
qwen_speech_rate
qwen_speech_register
qwen_speech_volume_level
qwen_vocabulary_complexity
qwen_voice_pitch
qwen_voice_type
real_language
ref_text_length
rir_room_size
rt60
sar
scoreq_nr
scoreq_ref
sdr
se_ci_sdr
se_sar
se_sdr
se_si_snr
sheet_ssqa
singmos
si_snr
snr_simulation
speaking_rate
speech_bert
speech_bleu
speech_token_distance
spk_similarity
srmr
stoi
urgent_mos
utmos
utmosv2
visqol
voicemos_real_mos
wer