Skip to content

Commit 070d36a

Browse files
authored
Speech specs + fix FLEURS + add additional audio dependencies (#3151)
1 parent f9c4498 commit 070d36a

File tree

5 files changed

+69
-10
lines changed

5 files changed

+69
-10
lines changed

setup.cfg

+1
Original file line numberDiff line numberDiff line change
@@ -275,6 +275,7 @@ heim =
275275

276276
audiolm =
277277
crfm-helm[openai]
278+
crfm-helm[google]
278279

279280
# For HuggingFace audio datasets
280281
soundfile~=0.12
Original file line numberDiff line numberDiff line change
@@ -1,16 +1,71 @@
11
entries: [
2+
####################################################################################################################
3+
# Auditory Perception
4+
####################################################################################################################
5+
{description: "meld_audio:model=audiolm", priority: 1}
6+
{description: "vocal_sound:model=audiolm", priority: 1}
7+
{description: "audiocaps:model=audiolm", priority: 1}
8+
9+
####################################################################################################################
10+
# Fairness
11+
####################################################################################################################
12+
13+
####################################################################################################################
14+
# Robustness
15+
####################################################################################################################
16+
217
{description: "audio_mnist:model=audiolm", priority: 1}
318

4-
# TODO: populate with the rest of the languages
5-
{description: "covost2:source_language=English,target_language=Chinese,model=audiolm", priority: 1}
19+
{description: "speech_robust_bench:subject=accented_cv,model=audiolm", priority: 1}
20+
{description: "speech_robust_bench:subject=accented_cv_es,model=audiolm", priority: 1}
21+
{description: "speech_robust_bench:subject=chime_far,model=audiolm", priority: 1}
22+
{description: "speech_robust_bench:subject=chime_near,model=audiolm", priority: 1}
23+
{description: "speech_robust_bench:subject=ami_far,model=audiolm", priority: 1}
24+
{description: "speech_robust_bench:subject=ami_near,model=audiolm", priority: 1}
25+
26+
27+
####################################################################################################################
28+
# Bias
29+
####################################################################################################################
630

7-
{description: "vocal_sound:model=audiolm", priority: 1}
31+
32+
####################################################################################################################
33+
# Multilinguality
34+
####################################################################################################################
835

936
# TODO: populate with the rest of the languages
37+
{description: "covost2:source_language=English,target_language=Chinese,model=audiolm", priority: 1}
38+
39+
# Other languages covered by the multilinguality aspect
1040
{description: "multilingual_librispeech:language=Dutch,model=audiolm", priority: 1}
41+
{description: "multilingual_librispeech:language=Spanish,model=audiolm", priority: 1}
42+
{description: "multilingual_librispeech:language=Italian,model=audiolm", priority: 1}
43+
{description: "multilingual_librispeech:language=German,model=audiolm", priority: 1}
44+
{description: "multilingual_librispeech:language=French,model=audiolm", priority: 1}
45+
{description: "multilingual_librispeech:language=Portuguese,model=audiolm", priority: 1}
46+
{description: "multilingual_librispeech:language=Polish,model=audiolm", priority: 1}
1147

12-
# TODO: populate with the rest of the languages
1348
{description: "fleurs:language=Finnish,model=audiolm", priority: 1}
49+
{description: "fleurs:language=Bulgarian,model=audiolm", priority: 1}
50+
{description: "fleurs:language=Hebrew,model=audiolm", priority: 1}
51+
{description: "fleurs:language=Zulu,model=audiolm", priority: 1}
52+
{description: "fleurs:language=Bengali,model=audiolm", priority: 1}
53+
{description: "fleurs:language=Thai,model=audiolm", priority: 1}
54+
{description: "fleurs:language=Mandarin_Chinese,model=audiolm", priority: 1}
55+
56+
{description: "common_voice_15:language=English,model=audiolm", priority: 1}
57+
{description: "common_voice_15:language=Chinese_hk,model=audiolm", priority: 1}
58+
{description: "common_voice_15:language=German,model=audiolm", priority: 1}
59+
{description: "common_voice_15:language=French,model=audiolm", priority: 1}
60+
61+
####################################################################################################################
62+
# Toxicity
63+
####################################################################################################################
64+
65+
66+
####################################################################################################################
67+
# Safety
68+
####################################################################################################################
69+
1470

15-
{description: "audiocaps:model=audiolm", priority: 1}
1671
]

src/helm/benchmark/scenarios/audio_language/common_voice_15_scenario.py

+1
Original file line numberDiff line numberDiff line change
@@ -86,6 +86,7 @@ def get_instances(self, output_path: str) -> List[Instance]:
8686
name=language_category,
8787
cache_dir=output_path,
8888
split=TEST_SPLIT,
89+
trust_remote_code=True,
8990
)
9091
):
9192
local_audio_path = row["path"]

src/helm/benchmark/scenarios/audio_language/fleurs_scenario.py

+6-4
Original file line numberDiff line numberDiff line change
@@ -58,8 +58,8 @@ class FLEURSScenario(Scenario):
5858
("Burmese", "my"),
5959
("Catalan", "ca"),
6060
("Cebuano", "ceb"),
61-
("Mandarin Chinese", "cmn_hans"),
62-
("Cantonese Chinese", "yue_hant"),
61+
("Mandarin_Chinese", "cmn_hans"),
62+
("Cantonese_Chinese", "yue_hant"),
6363
("Croatian", "hr"),
6464
("Czech", "cs"),
6565
("Danish", "da"),
@@ -278,9 +278,10 @@ class FLEURSScenario(Scenario):
278278
def __init__(self, language: str) -> None:
279279
super().__init__()
280280

281-
language = language.capitalize()
282281
if language not in FLEURSScenario._FLEURS_TEST_LANG_TO_ID.keys():
283-
raise ValueError(f"Invalid language. Valid languages are: {FLEURSScenario._FLEURS_TEST_LANG_TO_ID.keys()}")
282+
raise ValueError(
283+
f"Invalid language: {language}. Valid languages are: {FLEURSScenario._FLEURS_TEST_LANG_TO_ID.keys()}"
284+
)
284285

285286
self._fleurs_lang_short_to_long = {v: k for k, v in FLEURSScenario._FLEURS_LANG_TO_ID.items()}
286287
self._fleurs_long_to_lang = {
@@ -298,6 +299,7 @@ def get_instances(self, output_path: str) -> List[Instance]:
298299
name=f"fleurs.{language_category}",
299300
cache_dir=output_path,
300301
split=TEST_SPLIT,
302+
trust_remote_code=True,
301303
)
302304
):
303305
local_audio_path = row["path"]

src/helm/benchmark/scenarios/audio_language/multilingual_librispeech_scenario.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -46,7 +46,7 @@ class MultilingualLibriSpeechScenario(Scenario):
4646
description = (
4747
"Speech recognition in 7 different languages ([Pratap et al, 2022](https://arxiv.org/abs/2012.03411))."
4848
)
49-
tags: List[str] = ["audio", "multilinguality", "regocnition"]
49+
tags: List[str] = ["audio", "multilinguality", "recognition"]
5050

5151
def __init__(self, language: str) -> None:
5252
super().__init__()

0 commit comments

Comments
 (0)