ESPnet
multilingual
audio
universa
File size: 1,205 Bytes
46b48bd
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
asr_match_error_rate
asvspoof_score
audiobox_aesthetics_CE
audiobox_aesthetics_CU
audiobox_aesthetics_PC
audiobox_aesthetics_PQ
cer
ci_sdr
dns_overall
dns_p808
emotion_similarity
f0corr
f0rmse
language
mcd
nisqa_col_pred
nisqa_dis_pred
nisqa_loud_pred
nisqa_mos_pred
nisqa_noi_pred
nisqa_real_mos
nomad
noresqa_score
pam_score
pesq
plcmos
pred_text_length
pysepm_c_bak
pysepm_cd
pysepm_c_ovl
pysepm_c_sig
pysepm_csii_high
pysepm_csii_low
pysepm_csii_mid
pysepm_fwsegsnr
pysepm_llr
pysepm_ncm
pysepm_wss
qwen_channel_type
qwen_language
qwen_laughter_crying
qwen_pitch_range
qwen_recording_quality
qwen_speaker_age
qwen_speaker_count
qwen_speaker_gender
qwen_speaking_style
qwen_speech_background_environment
qwen_speech_clarity
qwen_speech_emotion
qwen_speech_impairment
qwen_speech_purpose
qwen_speech_rate
qwen_speech_register
qwen_speech_volume_level
qwen_vocabulary_complexity
qwen_voice_pitch
qwen_voice_type
real_language
ref_text_length
rir_room_size
rt60
sar
scoreq_nr
scoreq_ref
sdr
se_ci_sdr
se_sar
se_sdr
se_si_snr
sheet_ssqa
singmos
si_snr
snr_simulation
speaking_rate
speech_bert
speech_bleu
speech_token_distance
spk_similarity
srmr
stoi
urgent_mos
utmos
utmosv2
visqol
voicemos_real_mos
wer