Spaces:
Running
Running
Upload folder using huggingface_hub
Browse files- results/bleu/st.csv +4 -0
- results/llama3_70b_judge/ac.csv +4 -0
- results/llama3_70b_judge/aqa.csv +4 -0
- results/llama3_70b_judge/ar.csv +4 -0
- results/llama3_70b_judge/si.csv +4 -0
- results/llama3_70b_judge/sqa.csv +4 -0
- results/llama3_70b_judge_binary/er.csv +4 -0
- results/llama3_70b_judge_binary/gr.csv +4 -0
- results/llama3_70b_judge_binary/sqa.csv +4 -0
- results/meteor/ac.csv +4 -0
- results/wer/asr.csv +4 -0
- results/wer/cnasr.csv +4 -0
results/bleu/st.csv
CHANGED
@@ -1 +1,5 @@
|
|
1 |
Model,covost2_en_id_test,covost2_en_zh_test,covost2_en_ta_test,covost2_id_en_test,covost2_zh_en_test,covost2_ta_en_test
|
|
|
|
|
|
|
|
|
|
1 |
Model,covost2_en_id_test,covost2_en_zh_test,covost2_en_ta_test,covost2_id_en_test,covost2_zh_en_test,covost2_ta_en_test
|
2 |
+
salmonn_7b,14.135708265627702,34.055681569415356,0.00045042243733421275,27.877196356747618,5.2319724257915645,0.4256092994569619
|
3 |
+
wavllm_fairseq,13.841886973016162,31.96381187282953,0.0033159224040994286,5.933522277713613,2.368659001743569,0.1695522548322915
|
4 |
+
whisper_large_v3_with_llama_3_8b_instruct,,,,,,
|
5 |
+
qwen_audio_chat,4.121393814607146,15.307536203629063,0.030392249793261363,0.5089433695608178,10.019503192969147,0.018955183488794443
|
results/llama3_70b_judge/ac.csv
CHANGED
@@ -1 +1,5 @@
|
|
1 |
Model,audiocaps_test,wavcaps_test
|
|
|
|
|
|
|
|
|
|
1 |
Model,audiocaps_test,wavcaps_test
|
2 |
+
salmonn_7b,34.372727272727275,21.15606936416185
|
3 |
+
wavllm_fairseq,6.00909090909091,6.901734104046243
|
4 |
+
whisper_large_v3_with_llama_3_8b_instruct,0.10159090909090909,0.16358381502890174
|
5 |
+
qwen_audio_chat,43.82272727272727,29.248554913294797
|
results/llama3_70b_judge/aqa.csv
CHANGED
@@ -1 +1,5 @@
|
|
1 |
Model,clotho_aqa_test,audiocaps_qa_test,wavcaps_qa_test
|
|
|
|
|
|
|
|
|
|
1 |
Model,clotho_aqa_test,audiocaps_qa_test,wavcaps_qa_test
|
2 |
+
salmonn_7b,55.75299866725899,47.02875399361022,46.25
|
3 |
+
wavllm_fairseq,43.01199466903598,29.840255591054312,26.25
|
4 |
+
whisper_large_v3_with_llama_3_8b_instruct,1.4278098622834297,0.7252396166134185,0.819078947368421
|
5 |
+
qwen_audio_chat,58.196357174589075,47.98722044728435,38.68421052631579
|
results/llama3_70b_judge/ar.csv
CHANGED
@@ -1 +1,5 @@
|
|
1 |
Model,voxceleb_accent_test
|
|
|
|
|
|
|
|
|
|
1 |
Model,voxceleb_accent_test
|
2 |
+
salmonn_7b,37.443578169881
|
3 |
+
wavllm_fairseq,37.652851867049655
|
4 |
+
whisper_large_v3_with_llama_3_8b_instruct,1.9214197784160854
|
5 |
+
qwen_audio_chat,45.699630693475584
|
results/llama3_70b_judge/si.csv
CHANGED
@@ -1 +1,5 @@
|
|
1 |
Model,openhermes_audio_test,alpaca_audio_test
|
|
|
|
|
|
|
|
|
|
1 |
Model,openhermes_audio_test,alpaca_audio_test
|
2 |
+
salmonn_7b,19.2,12.4
|
3 |
+
wavllm_fairseq,18.0,21.200000000000003
|
4 |
+
whisper_large_v3_with_llama_3_8b_instruct,2.88,3.46
|
5 |
+
qwen_audio_chat,11.0,9.6
|
results/llama3_70b_judge/sqa.csv
CHANGED
@@ -1 +1,5 @@
|
|
1 |
Model,slue_p2_sqa5_test,public_sg_speech_qa_test,spoken_squad_v1
|
|
|
|
|
|
|
|
|
|
1 |
Model,slue_p2_sqa5_test,public_sg_speech_qa_test,spoken_squad_v1
|
2 |
+
salmonn_7b,78.23529411764706,56.77325581395348,
|
3 |
+
wavllm_fairseq,84.95098039215685,59.36046511627907,
|
4 |
+
whisper_large_v3_with_llama_3_8b_instruct,4.2181372549019605,3.20203488372093,
|
5 |
+
qwen_audio_chat,76.12745098039215,57.47093023255814,
|
results/llama3_70b_judge_binary/er.csv
CHANGED
@@ -1 +1,5 @@
|
|
1 |
Model,iemocap_emotion_test,meld_sentiment_test,meld_emotion_test
|
|
|
|
|
|
|
|
|
|
1 |
Model,iemocap_emotion_test,meld_sentiment_test,meld_emotion_test
|
2 |
+
salmonn_7b,21.55688622754491,41.877394636015325,33.06513409961686
|
3 |
+
wavllm_fairseq,45.90818363273453,50.076628352490424,41.0727969348659
|
4 |
+
whisper_large_v3_with_llama_3_8b_instruct,,,
|
5 |
+
qwen_audio_chat,27.345309381237527,43.86973180076628,50.57471264367817
|
results/llama3_70b_judge_binary/gr.csv
CHANGED
@@ -1 +1,5 @@
|
|
1 |
Model,voxceleb_gender_test,iemocap_gender_test
|
|
|
|
|
|
|
|
|
|
1 |
Model,voxceleb_gender_test,iemocap_gender_test
|
2 |
+
salmonn_7b,88.90028723840788,51.59680638722555
|
3 |
+
wavllm_fairseq,69.67583093967994,
|
4 |
+
whisper_large_v3_with_llama_3_8b_instruct,,
|
5 |
+
qwen_audio_chat,70.55806319244974,51.796407185628745
|
results/llama3_70b_judge_binary/sqa.csv
CHANGED
@@ -1 +1,5 @@
|
|
1 |
Model,cn_college_listen_mcq_test,dream_tts_mcq_test
|
|
|
|
|
|
|
|
|
|
1 |
Model,cn_college_listen_mcq_test,dream_tts_mcq_test
|
2 |
+
salmonn_7b,50.5063848524879,55.933089388395196
|
3 |
+
wavllm_fairseq,,
|
4 |
+
whisper_large_v3_with_llama_3_8b_instruct,,
|
5 |
+
qwen_audio_chat,60.85424922941436,57.76267642446419
|
results/meteor/ac.csv
CHANGED
@@ -1 +1,5 @@
|
|
1 |
Model,audiocaps_test,wavcaps_test
|
|
|
|
|
|
|
|
|
|
1 |
Model,audiocaps_test,wavcaps_test
|
2 |
+
salmonn_7b,,
|
3 |
+
wavllm_fairseq,,
|
4 |
+
whisper_large_v3_with_llama_3_8b_instruct,,
|
5 |
+
qwen_audio_chat,,
|
results/wer/asr.csv
CHANGED
@@ -1 +1,5 @@
|
|
1 |
Model,librispeech_test_clean,librispeech_test_other,common_voice_15_en_test,peoples_speech_test,gigaspeech_test,earnings21_test,earnings22_test,tedlium3_test,tedlium3_long_form_test,imda_part1_asr_test,imda_part2_asr_test,imda_part3_asr_test,imda_part4_asr_test,imda_part5_asr_test,imda_part6_asr_test
|
|
|
|
|
|
|
|
|
|
1 |
Model,librispeech_test_clean,librispeech_test_other,common_voice_15_en_test,peoples_speech_test,gigaspeech_test,earnings21_test,earnings22_test,tedlium3_test,tedlium3_long_form_test,imda_part1_asr_test,imda_part2_asr_test,imda_part3_asr_test,imda_part4_asr_test,imda_part5_asr_test,imda_part6_asr_test
|
2 |
+
salmonn_7b,0.555834307918663,0.4180490665254317,0.3375363911542985,0.34335568653146914,0.14226764839341272,0.2687240831119165,0.3638199574803293,0.08558958163301515,0.18386810849140223,0.1581255622670608,0.6915082052617869,0.8632952723448728,1.0998724881343125,0.7462024043822395,0.5240368577507283
|
3 |
+
wavllm_fairseq,0.02103218017882069,0.04798834811886432,0.14533325621300636,0.3792176325635977,0.15491778414546403,0.6447482518259942,0.6671766188447099,0.06621482559171073,0.4536784258110264,0.07762498393522684,0.4511070591299818,0.8449539438237986,,0.652558845214085,0.5275247040334478
|
4 |
+
whisper_large_v3_with_llama_3_8b_instruct,0.01831591655034519,0.03714982881570734,0.09876543209876543,0.14540692118393275,0.09515429104337297,0.11773910240019567,0.15611126487402763,0.038146268762641496,0.04754476156709803,0.0464432592211798,0.2904141703568638,0.33025751212260873,0.5142358733382134,0.4662862470067086,0.28367569330674514
|
5 |
+
qwen_audio_chat,0.02246576376051609,0.04163277659031154,0.11645169375518152,0.30723956433545313,0.13316235845059654,0.38460383986837277,0.511809498898483,0.03995599872254356,0.45289842226555577,0.08434005911836524,0.5057046105756707,1.0992041596614108,1.3267786724597983,0.7411298037375774,0.7668393782383419
|
results/wer/cnasr.csv
CHANGED
@@ -1 +1,5 @@
|
|
1 |
Model,aishell_asr_zh_test
|
|
|
|
|
|
|
|
|
|
1 |
Model,aishell_asr_zh_test
|
2 |
+
salmonn_7b,0.8527647443131199
|
3 |
+
wavllm_fairseq,0.7054601967888183
|
4 |
+
whisper_large_v3_with_llama_3_8b_instruct,
|
5 |
+
qwen_audio_chat,0.06602522222882144
|