evaluation
Browse files
README.md
CHANGED
@@ -11,7 +11,21 @@ datasets:
|
|
11 |
- mozilla-foundation/common_voice_8_0
|
12 |
model-index:
|
13 |
- name: wav2vec2-xls-r-300m-gn-cv8
|
14 |
-
results:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
15 |
---
|
16 |
|
17 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
|
|
11 |
- mozilla-foundation/common_voice_8_0
|
12 |
model-index:
|
13 |
- name: wav2vec2-xls-r-300m-gn-cv8
|
14 |
+
results:
|
15 |
+
- task:
|
16 |
+
name: Automatic Speech Recognition
|
17 |
+
type: automatic-speech-recognition
|
18 |
+
dataset:
|
19 |
+
name: Common Voice 8
|
20 |
+
type: mozilla-foundation/common_voice_8_0
|
21 |
+
args: gn
|
22 |
+
metrics:
|
23 |
+
- name: Test WER
|
24 |
+
type: wer
|
25 |
+
value: 69.05
|
26 |
+
- name: Test CER
|
27 |
+
type: cer
|
28 |
+
value: 14.70
|
29 |
---
|
30 |
|
31 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
eval.py
ADDED
@@ -0,0 +1,137 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
#!/usr/bin/env python3
|
2 |
+
import argparse
|
3 |
+
import re
|
4 |
+
from typing import Dict
|
5 |
+
|
6 |
+
import torch
|
7 |
+
from datasets import Audio, Dataset, load_dataset, load_metric
|
8 |
+
|
9 |
+
from transformers import AutoFeatureExtractor, pipeline
|
10 |
+
|
11 |
+
|
12 |
+
def log_results(result: Dataset, args: argparse.Namespace):
    """Compute WER/CER for ``result`` and write them (and optionally all outputs) to disk.

    The metric computation itself is deliberately left exactly as in the
    evaluation template ("DO NOT CHANGE") so that scores stay comparable.

    Args:
        result: Dataset exposing ``"target"`` and ``"prediction"`` columns.
        args: Parsed command-line namespace. Reads ``args.log_outputs``,
            ``args.dataset``, ``args.config`` and ``args.split``.

    Side effects:
        Prints the scores, writes ``<dataset_id>_eval_results.txt`` and, when
        ``args.log_outputs`` is truthy, ``log_<dataset_id>_predictions.txt``
        and ``log_<dataset_id>_targets.txt`` in the current directory.
    """
    log_outputs = args.log_outputs
    # e.g. "org/name" + config + split -> "org_name_config_split"
    dataset_id = "_".join(args.dataset.split("/") + [args.config, args.split])

    # load metric
    wer = load_metric("wer")
    cer = load_metric("cer")

    # compute metrics
    wer_result = wer.compute(references=result["target"], predictions=result["prediction"])
    cer_result = cer.compute(references=result["target"], predictions=result["prediction"])

    # print & log results
    result_str = f"WER: {wer_result}\n" f"CER: {cer_result}"
    print(result_str)

    # Explicit UTF-8: transcripts contain non-ASCII characters and must not
    # depend on the platform's default encoding.
    with open(f"{dataset_id}_eval_results.txt", "w", encoding="utf-8") as f:
        f.write(result_str)

    # log all results in text file. Possibly interesting for analysis
    # `--log_outputs` is a store_true flag (False/True, never None), so test
    # its truth value; an `is not None` check would always pass.
    if log_outputs:
        pred_file = f"log_{dataset_id}_predictions.txt"
        target_file = f"log_{dataset_id}_targets.txt"

        with open(pred_file, "w", encoding="utf-8") as p, open(target_file, "w", encoding="utf-8") as t:

            # mapping function to write output: index line, then text line
            def write_to_file(batch, i):
                p.write(f"{i}" + "\n")
                p.write(batch["prediction"] + "\n")
                t.write(f"{i}" + "\n")
                t.write(batch["target"] + "\n")

            result.map(write_to_file, with_indices=True)
|
48 |
+
|
49 |
+
|
50 |
+
def normalize_text(text: str) -> str:
    """DO ADAPT FOR YOUR USE CASE. Normalize a reference transcript for scoring.

    The text is lower-cased, the punctuation characters listed in
    ``chars_to_ignore_regex`` are removed, and newlines / short runs of spaces
    are replaced by a single space.

    Args:
        text: Raw reference sentence.

    Returns:
        The normalized sentence.
    """
    # IMPORTANT: this should correspond to the chars that were ignored during training.
    # Raw string so the regex escapes are not treated as (invalid) Python
    # string escapes; the pattern passed to `re` is unchanged.
    chars_to_ignore_regex = r'[,?.!\-\;\:"“%‘”�—’…–]'

    text = re.sub(chars_to_ignore_regex, "", text.lower())

    # In addition, normalize the target text, e.g. removing newline characters.
    # Note that order is important here: longer sequences must be replaced
    # before their shorter prefixes. The space runs are spelled with `*` so
    # their length stays unambiguous.
    token_sequences_to_ignore = ["\n\n", "\n", " " * 3, " " * 2]

    for t in token_sequences_to_ignore:
        text = " ".join(text.split(t))

    return text
|
65 |
+
|
66 |
+
|
67 |
+
def main(args):
    """Transcribe every example of the requested dataset split and log the scores.

    Reads ``args.dataset``, ``args.config``, ``args.split``, ``args.model_id``,
    ``args.device``, ``args.chunk_length_s`` and ``args.stride_length_s``.
    When ``args.device`` is ``None`` it is filled in here (0 if CUDA is
    available, otherwise -1).
    """
    # Fetch the split to evaluate (use_auth_token=True is passed to the loader).
    eval_split = load_dataset(args.dataset, args.config, split=args.split, use_auth_token=True)

    # Debugging aid: uncomment to evaluate only the first 10 examples.
    # eval_split = eval_split.select(range(10))

    # The feature extractor tells us which sampling rate the model expects.
    extractor = AutoFeatureExtractor.from_pretrained(args.model_id)
    target_rate = extractor.sampling_rate

    # Re-cast the audio column so it is decoded at that sampling rate.
    eval_split = eval_split.cast_column("audio", Audio(sampling_rate=target_rate))

    # Pick a device automatically when none was requested.
    if args.device is None:
        if torch.cuda.is_available():
            args.device = 0
        else:
            args.device = -1

    asr = pipeline(
        "automatic-speech-recognition",
        model=args.model_id,
        device=args.device,
        feature_extractor=extractor,
    )

    def map_to_pred(batch):
        # Transcribe one example and pair it with its normalized reference.
        output = asr(
            batch["audio"]["array"],
            chunk_length_s=args.chunk_length_s,
            stride_length_s=args.stride_length_s,
        )
        batch["prediction"] = output["text"]
        batch["target"] = normalize_text(batch["sentence"])
        return batch

    # Run inference on all examples, keeping only the columns added above.
    original_columns = eval_split.column_names
    result = eval_split.map(map_to_pred, remove_columns=original_columns)

    # Compute and log the metrics.
    log_results(result, args)
|
102 |
+
|
103 |
+
|
104 |
+
if __name__ == "__main__":
    # Command-line entry point: parse the evaluation options and hand them to main().
    parser = argparse.ArgumentParser()

    parser.add_argument(
        "--model_id", type=str, required=True, help="Model identifier. Should be loadable with 🤗 Transformers"
    )
    parser.add_argument(
        "--dataset",
        type=str,
        required=True,
        help="Dataset name to evaluate the `model_id`. Should be loadable with 🤗 Datasets",
    )
    parser.add_argument(
        "--config", type=str, required=True, help="Config of the dataset. *E.g.* `'en'` for Common Voice"
    )
    parser.add_argument("--split", type=str, required=True, help="Split of the dataset. *E.g.* `'test'`")
    # The help texts below state the real defaults (None); the values are
    # forwarded to the pipeline as-is.
    parser.add_argument(
        "--chunk_length_s",
        type=float,
        default=None,
        help="Chunk length in seconds. Not set by default (None is passed to the pipeline).",
    )
    parser.add_argument(
        "--stride_length_s",
        type=float,
        default=None,
        help="Stride of the audio chunks in seconds. Not set by default (None is passed to the pipeline).",
    )
    parser.add_argument(
        "--log_outputs", action="store_true", help="If defined, write outputs to log file for analysis."
    )
    parser.add_argument(
        "--device",
        type=int,
        default=None,
        help=(
            "The device to run the pipeline on. -1 for CPU, 0 for the first GPU and so on. "
            "If omitted, the first GPU is used when CUDA is available, otherwise the CPU."
        ),
    )
    args = parser.parse_args()

    main(args)
|
eval.sh
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
# Evaluate the model stored in the current directory on the `gn` config, `test` split of
# mozilla-foundation/common_voice_8_0; --log_outputs requests the prediction/target log files.
python3 eval.py --model_id ./ --dataset mozilla-foundation/common_voice_8_0 --config gn --split test --log_outputs
|
log_mozilla-foundation_common_voice_8_0_gn_test_predictions.txt
ADDED
@@ -0,0 +1,318 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
0
|
2 |
+
kóva ipukóta
|
3 |
+
1
|
4 |
+
nacheko'eporãi
|
5 |
+
2
|
6 |
+
ikatéva haichapiĩva
|
7 |
+
3
|
8 |
+
ijeike políticape
|
9 |
+
4
|
10 |
+
aikuaa amanótaha
|
11 |
+
5
|
12 |
+
ha hi'ariete ndaje ohepyi mbe'ẽ hikuái chupe
|
13 |
+
6
|
14 |
+
koʼag̃aite ndaikatui ahecha ndeve
|
15 |
+
7
|
16 |
+
ikaambýgui ojeja pokesu
|
17 |
+
8
|
18 |
+
eipyhýpe ajaka ha tereko ejogua ñandéve ipokueterãiñakangue
|
19 |
+
9
|
20 |
+
ohenduvo umi mba'e ña mariao porandujeýkuri
|
21 |
+
10
|
22 |
+
aru uma ñanerentã kavaju
|
23 |
+
11
|
24 |
+
oñoty ylyguipe kavo ra'ỹi
|
25 |
+
12
|
26 |
+
chy 'año che rógape
|
27 |
+
13
|
28 |
+
cheve roguarã oĩporã
|
29 |
+
14
|
30 |
+
aporanduichaangirũme ha nandekuaái
|
31 |
+
15
|
32 |
+
vetárã oikove
|
33 |
+
16
|
34 |
+
naha ʼéi vaicha henda
|
35 |
+
17
|
36 |
+
hetilopoétiko oipurúva
|
37 |
+
18
|
38 |
+
ha hesereikumandára ha aveikuratepeĩ
|
39 |
+
19
|
40 |
+
upeva ha óere avei imaymátapisa uoñoogñareko porã itayrahaitajyrakuérare
|
41 |
+
20
|
42 |
+
tereho koág̃a pya'aike
|
43 |
+
21
|
44 |
+
haʼéi omondo apymembykuéra mboaeheaópe
|
45 |
+
22
|
46 |
+
ekove hohembiapokue
|
47 |
+
23
|
48 |
+
kasonimonde'u pyhare
|
49 |
+
24
|
50 |
+
ndekera seraha
|
51 |
+
25
|
52 |
+
ivahéhi la situ
|
53 |
+
26
|
54 |
+
ojaguamascáda ha patélma ndiro
|
55 |
+
27
|
56 |
+
pyhareo u jeypi ojahu ho'u ho'uva ha oñenóõke
|
57 |
+
28
|
58 |
+
oñomongetakyre'ỹhaipa haitépe katu ombojoaju hikuái hekove
|
59 |
+
29
|
60 |
+
iñirũnguéra oñemondoipa ha py'aréipeko osẽ ohopa heseve ikotýpekuéra
|
61 |
+
30
|
62 |
+
añembotavýnte ha ndaʼéi mbaʼe vete che rembirekope
|
63 |
+
31
|
64 |
+
moõjeý pa oime reho
|
65 |
+
32
|
66 |
+
oguahẽvo ogaípe omombeu ohechavaʼekue
|
67 |
+
33
|
68 |
+
peteĩ tava'ípe oikova'ekue ñakame ha inemby kalo
|
69 |
+
34
|
70 |
+
mitãmi ha mitãrusúrõ
|
71 |
+
35
|
72 |
+
ndetavy
|
73 |
+
36
|
74 |
+
omanopove che mbarakajamiojuka avei vare'águi angujape
|
75 |
+
37
|
76 |
+
araka'eve nombotovei avavépe
|
77 |
+
38
|
78 |
+
ña mbojojava'erã
|
79 |
+
39
|
80 |
+
ha'ekóera niko oikova'ekue ñepyrũrámi itakyrýpe
|
81 |
+
40
|
82 |
+
ami rejahéi avavéridentevoi haʼégui upe ereje a póva
|
83 |
+
41
|
84 |
+
tereho porainte
|
85 |
+
42
|
86 |
+
hembiapokue itatu ombohesape'a tadayguápe
|
87 |
+
43
|
88 |
+
mitãrusu hemyhéẽva pokavyha kerayvotyeta poarãgui
|
89 |
+
44
|
90 |
+
epu'ã ha eñepyrujey
|
91 |
+
45
|
92 |
+
oñemboatypajeíkuri ihikuái
|
93 |
+
46
|
94 |
+
mborevirape
|
95 |
+
47
|
96 |
+
javinéte oguerekóva
|
97 |
+
48
|
98 |
+
cheʼeremánoe laʼipuravéva
|
99 |
+
49
|
100 |
+
mba'érepa re'use eira
|
101 |
+
50
|
102 |
+
hekovepaha omanomboype
|
103 |
+
51
|
104 |
+
peteĩ ára je ña nderu outujamiramo oguatávo yvape ári
|
105 |
+
52
|
106 |
+
eguerumina ché vechevosa rejukuevo
|
107 |
+
53
|
108 |
+
tólao ñemoñarõ
|
109 |
+
54
|
110 |
+
mba'éichapa héra nde ragaugua
|
111 |
+
55
|
112 |
+
ohoreĩngo heseve hikuái
|
113 |
+
56
|
114 |
+
jahechángo hogagua apehapépeauku'e
|
115 |
+
57
|
116 |
+
oñepyrũkuri ojo'o hoho oimoaaỹre ojuhu hikuái peteĩ kuña rete kanguekue
|
117 |
+
58
|
118 |
+
mboha pyve ijavo moarotĩ lehege guapyhína tapeykepe
|
119 |
+
59
|
120 |
+
mba'érepa naporandói chupe mavapahae
|
121 |
+
60
|
122 |
+
ña maria niko upepeguavoíkuri
|
123 |
+
61
|
124 |
+
py'ỹintei amañajey hesei
|
125 |
+
62
|
126 |
+
upéi ijára ohecha chupe ha'ipochy
|
127 |
+
63
|
128 |
+
ñemosã ha ãpe hapependereraha
|
129 |
+
64
|
130 |
+
oipokuaa ha oipykua tuichami hitajýra ha kalaícuive rocpe
|
131 |
+
65
|
132 |
+
mokõinko tymi ha peteĩ nkátaypy
|
133 |
+
66
|
134 |
+
mávape piko taita
|
135 |
+
67
|
136 |
+
néi mandu'anpei itúva haisyre
|
137 |
+
68
|
138 |
+
che nañe'ẽi guaranime
|
139 |
+
69
|
140 |
+
paraguái guyeraite
|
141 |
+
70
|
142 |
+
ág̃anteko ajava'erã laprisésare
|
143 |
+
71
|
144 |
+
bua'uhápente oinupã chupe
|
145 |
+
72
|
146 |
+
mba'épa raeijapova'erã reiko pukuche'õ
|
147 |
+
73
|
148 |
+
po'aa ndaja chokói
|
149 |
+
74
|
150 |
+
ha upépe oikópe kaoruguachu
|
151 |
+
75
|
152 |
+
opu'a jave ohohagua oguerúi mbaʼe
|
153 |
+
76
|
154 |
+
ma'ymave apysápe oike nomarandu
|
155 |
+
77
|
156 |
+
raulpéña ha omboaeha otelamáicpegua
|
157 |
+
78
|
158 |
+
ho 'u paite
|
159 |
+
79
|
160 |
+
ohasa jey peteĩ arapokoimby
|
161 |
+
80
|
162 |
+
oñaty
|
163 |
+
81
|
164 |
+
peĩ guahẽ
|
165 |
+
82
|
166 |
+
ami ndnoede nde'eireg̃o nenaiha ndejuku
|
167 |
+
83
|
168 |
+
aguy je
|
169 |
+
84
|
170 |
+
ypa'ũ rera
|
171 |
+
85
|
172 |
+
peteĩ tapepo'i puku opahápe ojogapókuri karaípoli karpo
|
173 |
+
86
|
174 |
+
ko ára niko hi'aramboty
|
175 |
+
87
|
176 |
+
nahesakaete chupe
|
177 |
+
88
|
178 |
+
ñe'ẽrã
|
179 |
+
89
|
180 |
+
ejapopu'ẽke reja povymbími
|
181 |
+
90
|
182 |
+
kojupi tendo tarapi
|
183 |
+
91
|
184 |
+
petrimo oñooitériko
|
185 |
+
92
|
186 |
+
avei oipuru ypyratã ha hu'ye
|
187 |
+
93
|
188 |
+
oveve áera ha á'era ñanereta tuisiakuejaveve
|
189 |
+
94
|
190 |
+
vya teoñeime
|
191 |
+
95
|
192 |
+
ndaéichapa ojehechakuaa
|
193 |
+
96
|
194 |
+
cheramoi oguapyva tatajerere
|
195 |
+
97
|
196 |
+
hekoreory ha imorangatúva
|
197 |
+
98
|
198 |
+
imembykóérape jepe ojaʼo upehaguere
|
199 |
+
99
|
200 |
+
peteĩ pyhare oguahe oúvo cheryvy peteĩn
|
201 |
+
100
|
202 |
+
imatakue ha ta
|
203 |
+
101
|
204 |
+
amirioĩjeýma iche ro'ape
|
205 |
+
102
|
206 |
+
peteĩ jatepoguachúpe katu oñembopopurma ndi'o
|
207 |
+
103
|
208 |
+
omivo tatu iporãvéntema
|
209 |
+
104
|
210 |
+
ejúpe itakóreri
|
211 |
+
105
|
212 |
+
aiñe'ĩ inglesikémi
|
213 |
+
106
|
214 |
+
kova ivaéi he'i imembykuru ruva
|
215 |
+
107
|
216 |
+
pemitãkuña omongaru umymbakuérape
|
217 |
+
108
|
218 |
+
ha oja'ojeyhag̃ua chupeojapohague rehesepeica
|
219 |
+
109
|
220 |
+
ta upéicha
|
221 |
+
110
|
222 |
+
oreko mokõi resasaʼyju
|
223 |
+
111
|
224 |
+
dojoguaiete isýpe
|
225 |
+
112
|
226 |
+
ha sypáma ha okuerajeýma hikuái
|
227 |
+
113
|
228 |
+
oñeguahẽ hagua
|
229 |
+
114
|
230 |
+
mba'apo na ñande'apoíri
|
231 |
+
115
|
232 |
+
mate oho'upaite cheterere
|
233 |
+
116
|
234 |
+
oĩ ojajaova'ekue oipururiavañe'ẽ
|
235 |
+
117
|
236 |
+
avei ykaraipyrékuruchumimi ha tataindy
|
237 |
+
118
|
238 |
+
karaicveréíra ombosako i irambosarã
|
239 |
+
119
|
240 |
+
añuakakuaa ndéve
|
241 |
+
120
|
242 |
+
terehupytyvy 'apamẽ
|
243 |
+
121
|
244 |
+
ombojeguapa ha ombohorýko ñareretã
|
245 |
+
122
|
246 |
+
cheroha yhuháicha ndaipotái cherayhu
|
247 |
+
123
|
248 |
+
ña nderu taneñongatoipópe
|
249 |
+
124
|
250 |
+
ka'arupytũvo omanóma katu
|
251 |
+
125
|
252 |
+
ko'ẽrvareko peteĩ aranducha uka
|
253 |
+
126
|
254 |
+
he'icheve ambyengovia hag̃ua peteĩ tesapeha pyahúvare
|
255 |
+
127
|
256 |
+
chengvaha ta chupe pyha rekue
|
257 |
+
128
|
258 |
+
hembiapo teete
|
259 |
+
129
|
260 |
+
irũnguéra
|
261 |
+
130
|
262 |
+
peteñ ára ovahẽmborika resýi peteĩ oga'i peve
|
263 |
+
131
|
264 |
+
ko'ág̃a oĩhámerijeta
|
265 |
+
132
|
266 |
+
upéi ñarembosa ta ñandegutope
|
267 |
+
133
|
268 |
+
aguahẽvo hẽnondépeajuhu iñipytuha
|
269 |
+
134
|
270 |
+
upépe katu iñarovéintema hendive mitã karialkúéra
|
271 |
+
135
|
272 |
+
peteĩ ára omañnosõpy'a upéi karai rembireko
|
273 |
+
136
|
274 |
+
mbohapy arahaguépe ntaje
|
275 |
+
137
|
276 |
+
irundy mondaha ojlapókuri hembiapovai molackue jerere
|
277 |
+
138
|
278 |
+
ama opororo yvytu reheve
|
279 |
+
139
|
280 |
+
ha veto'ipentevoi ojekuaave chupe
|
281 |
+
140
|
282 |
+
ichy omanókuriha 'e heñoirõ guare
|
283 |
+
141
|
284 |
+
peteĩ jey ñantoñavaka porã peteĩ iko'ẽ omarno
|
285 |
+
142
|
286 |
+
nochẽĩvaavoi upégui
|
287 |
+
143
|
288 |
+
anére ovepichahele
|
289 |
+
144
|
290 |
+
ipa'ũme hoĩ avei
|
291 |
+
145
|
292 |
+
hose okañu yvyrakutépe
|
293 |
+
146
|
294 |
+
imembykuera katu omendárehe ohopahhikuái
|
295 |
+
147
|
296 |
+
ndéve yemaña cherechioe
|
297 |
+
148
|
298 |
+
upéguintema ojeraháma chupe kuaretélpe
|
299 |
+
149
|
300 |
+
araváingohaiñipytũ ñepyrũma
|
301 |
+
150
|
302 |
+
upépyhare pukukueniko okyha peichajey iko'ẽ
|
303 |
+
151
|
304 |
+
tahaeha'épa eñembojakuaa che rajýrendape
|
305 |
+
152
|
306 |
+
aiko porã
|
307 |
+
153
|
308 |
+
teta sambyhýpe
|
309 |
+
154
|
310 |
+
mbo'úta ovale
|
311 |
+
155
|
312 |
+
hesu niko tuparaʼy
|
313 |
+
156
|
314 |
+
taguatoruichá niko pehekoverosandéva gyrakuerahesegua'apytépe
|
315 |
+
157
|
316 |
+
hetaitereirasa hoika hikuái ha mamope ndojuhúi mitã'i akãhratãme
|
317 |
+
158
|
318 |
+
ha ndoipotáivoi ha'e omenaoipohanu kava'ekue inosésiape
|
log_mozilla-foundation_common_voice_8_0_gn_test_targets.txt
ADDED
@@ -0,0 +1,318 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
0
|
2 |
+
kóva ipukúta
|
3 |
+
1
|
4 |
+
nacheko'ẽporãi
|
5 |
+
2
|
6 |
+
ikatéva ha ichapĩva
|
7 |
+
3
|
8 |
+
ijeike políticape
|
9 |
+
4
|
10 |
+
aikuaa amanotaha
|
11 |
+
5
|
12 |
+
ha hi'ariete ndaje ohepyme'ẽ hikuái chupe
|
13 |
+
6
|
14 |
+
ko'ag̃aite ndaikatúi ahecha ndéve
|
15 |
+
7
|
16 |
+
ikambýgui ojejapo kesu
|
17 |
+
8
|
18 |
+
eipyhy pe ajaka ha tereho ejogua ñandéve ipokue térã iñakãngue
|
19 |
+
9
|
20 |
+
ohendúvo umi mba'e ña maria oporandujeýikuri
|
21 |
+
10
|
22 |
+
arúma ñane renda kavaju
|
23 |
+
11
|
24 |
+
oñotỹ yvyguýpe ka'avo ra'ỹi
|
25 |
+
12
|
26 |
+
cheaño che rógape
|
27 |
+
13
|
28 |
+
chéverõ g̃uarã oĩ porã
|
29 |
+
14
|
30 |
+
aporandu che angirũme ha nandekuaái
|
31 |
+
15
|
32 |
+
tetã oikove
|
33 |
+
16
|
34 |
+
ndaha'éivaicha henda
|
35 |
+
17
|
36 |
+
estilo poético oiporúva
|
37 |
+
18
|
38 |
+
ha heseve kumanda ha avei kurapepẽ
|
39 |
+
19
|
40 |
+
upehaguére avei mayma tapicha oñangareko porã ita'ýra ha itajyrakuérare
|
41 |
+
20
|
42 |
+
¡tereho ko'ág̃a pya'éke
|
43 |
+
21
|
44 |
+
ha'e omondo imembykuéra mbo'ehaópe
|
45 |
+
22
|
46 |
+
hekove ha hembiapokue
|
47 |
+
23
|
48 |
+
káso ñemombeʼu pyhare
|
49 |
+
24
|
50 |
+
¡ndekyra che ra'a
|
51 |
+
25
|
52 |
+
ivai la situ
|
53 |
+
26
|
54 |
+
pajagua mascada ha pastel mandi'o
|
55 |
+
27
|
56 |
+
pyhare oújepi ojahu hoʼu hoʼúva ha oñeno oke
|
57 |
+
28
|
58 |
+
oñomongeta kyre'ỹ ha ipahaitépe katu ombojoaju hikuái hekove
|
59 |
+
29
|
60 |
+
iñirũnguéra oñemondyipa ha pya'épeko osẽ ohopa heseve ikotypekuéra
|
61 |
+
30
|
62 |
+
añembotavýnte ha nda'ei mba'evete che rembirekópe
|
63 |
+
31
|
64 |
+
moõjeýmapa oiméne oho
|
65 |
+
32
|
66 |
+
og̃uahẽvo oga'ípe omombe'u ohechava'ekue
|
67 |
+
33
|
68 |
+
peteĩ tava'ípe oikova'ekue ña kame ha imemby kalo
|
69 |
+
34
|
70 |
+
mitãmi ha mitãrusúrõ
|
71 |
+
35
|
72 |
+
ndetavy
|
73 |
+
36
|
74 |
+
omano mboyve che mbarakajami ojuka avei vare'águi angujápe
|
75 |
+
37
|
76 |
+
arakaʼeve nombotovéi avavépe
|
77 |
+
38
|
78 |
+
ñambojojávaʼerã
|
79 |
+
39
|
80 |
+
ha'ekuéra niko oikova'ekue ñepyrũrãme itakyrýpe
|
81 |
+
40
|
82 |
+
ani rejahéi avavére ndentevoi ha'égui upe reje'apóva
|
83 |
+
41
|
84 |
+
terehoporãite
|
85 |
+
42
|
86 |
+
hembiapokue ikatu ombohesapeʼa tavayguápe
|
87 |
+
43
|
88 |
+
mitãrusu henyhẽva pukavy ha kerayvotyeta porãgui
|
89 |
+
44
|
90 |
+
epu'ã ha eñepyrũjey
|
91 |
+
45
|
92 |
+
oñembyatypajeýkuri hikuái
|
93 |
+
46
|
94 |
+
mborevi rape
|
95 |
+
47
|
96 |
+
gabinete oguerekóva
|
97 |
+
48
|
98 |
+
che ermána la iporãvéva
|
99 |
+
49
|
100 |
+
mba'érepa re'use eíra
|
101 |
+
50
|
102 |
+
hekove paha omano mboyve
|
103 |
+
51
|
104 |
+
peteĩ áraje ñande ru ou tujamíramo oguatávo yvy ape ári
|
105 |
+
52
|
106 |
+
eguerumína chéve che vosa rejukuévo
|
107 |
+
53
|
108 |
+
toro ñemoñarõ
|
109 |
+
54
|
110 |
+
mba'éichapa héra nde rogaygua
|
111 |
+
55
|
112 |
+
ohoreíngo heseve hikuái
|
113 |
+
56
|
114 |
+
jahechángo ogaygua ápe ha pépe oku'e
|
115 |
+
57
|
116 |
+
oñepyrũkuri ojo'o ha oimo'ã'ỹre ojuhu hikuái peteĩ kuña rete kanguekue
|
117 |
+
58
|
118 |
+
mbohapyve ijao morotĩ reheve oguapýhina tape yképe
|
119 |
+
59
|
120 |
+
mba'érepa naporandúi chupe mávapa ha'e
|
121 |
+
60
|
122 |
+
ña maria niko upepeguavoíkuri
|
123 |
+
61
|
124 |
+
py'ỹinte amañajey hese
|
125 |
+
62
|
126 |
+
upéi ijára ohecha chupe ha ipochy
|
127 |
+
63
|
128 |
+
nemosã ha ápe ha pépe ndereraha
|
129 |
+
64
|
130 |
+
oipokua ha oipykua tujami itajýra ha karai riverospe
|
131 |
+
65
|
132 |
+
mokõi kotymi ha peteĩ tataypy
|
133 |
+
66
|
134 |
+
mávapepiko taita
|
135 |
+
67
|
136 |
+
naimandu'avéi itúva ha isýre
|
137 |
+
68
|
138 |
+
che nañe'ẽi guaraníme
|
139 |
+
69
|
140 |
+
paraguái guyraite
|
141 |
+
70
|
142 |
+
ág̃anteko ajava'erã la princesare
|
143 |
+
71
|
144 |
+
gua'uhápente oinupã chupe
|
145 |
+
72
|
146 |
+
mba'épa rejapova'erã reiko pukusérõ
|
147 |
+
73
|
148 |
+
poʼa ndajajokói
|
149 |
+
74
|
150 |
+
ha upépe oiko pe karuguasu
|
151 |
+
75
|
152 |
+
opu'ã jave oho hag̃ua ogueru imba'e
|
153 |
+
76
|
154 |
+
maymave apysápe oike ne marandu
|
155 |
+
77
|
156 |
+
raúl peña ha mboʼehao stella marispegua
|
157 |
+
78
|
158 |
+
houpaite
|
159 |
+
79
|
160 |
+
ohasajey peteĩ arapokõindy
|
161 |
+
80
|
162 |
+
oñotỹ
|
163 |
+
81
|
164 |
+
peg̃uahẽ
|
165 |
+
82
|
166 |
+
ani mbaʼeve nde eréva nembaʼeha ndejoko
|
167 |
+
83
|
168 |
+
aguyje
|
169 |
+
84
|
170 |
+
ypa'ũ réra
|
171 |
+
85
|
172 |
+
peteĩ tapepo'i puku opahápe ojogapókuri karai policarpo
|
173 |
+
86
|
174 |
+
ko ára niko hi'aramboty
|
175 |
+
87
|
176 |
+
nahesakãiete chupe
|
177 |
+
88
|
178 |
+
ñe'ẽrã
|
179 |
+
89
|
180 |
+
ejapopya'éke rejapóva'erã
|
181 |
+
90
|
182 |
+
ojupi tendotáramo
|
183 |
+
91
|
184 |
+
patrimonio histórico
|
185 |
+
92
|
186 |
+
avei oipuru yvyrapã ha hu'y
|
187 |
+
93
|
188 |
+
oveve ára ha ára ñane retã tuichakue javeve
|
189 |
+
94
|
190 |
+
vy'ápe oñeime
|
191 |
+
95
|
192 |
+
mba'éichapa ojehechakuaa
|
193 |
+
96
|
194 |
+
che ramói oguapýva tata jerére
|
195 |
+
97
|
196 |
+
hekorory ha imarangatúva
|
197 |
+
98
|
198 |
+
imembykuérape jepe oja'o upehaguére
|
199 |
+
99
|
200 |
+
peteĩ pyhare og̃uahẽ oúvo che ryvy peteĩ
|
201 |
+
100
|
202 |
+
imatakue hatã
|
203 |
+
101
|
204 |
+
nahániri oĩjeýma che rógape
|
205 |
+
102
|
206 |
+
peteĩ japepo guasúpe katu oñembopupu mandi'o
|
207 |
+
103
|
208 |
+
umíva katu iporãvéntema
|
209 |
+
104
|
210 |
+
ejúpy jaterere
|
211 |
+
105
|
212 |
+
oñe'ẽ inglés ñe'ẽme
|
213 |
+
106
|
214 |
+
kóva ivai he'i imemby kururúva
|
215 |
+
107
|
216 |
+
pe mitãkuña omongaru mymbakuérape
|
217 |
+
108
|
218 |
+
ha oja'ojey hag̃ua chupe ojapohaguére hese péicha
|
219 |
+
109
|
220 |
+
taupéicha
|
221 |
+
110
|
222 |
+
oreko mokõi resa sa'yju
|
223 |
+
111
|
224 |
+
ndojoguaiete isýpe
|
225 |
+
112
|
226 |
+
hasypáma ha okuerajeýma hikuái
|
227 |
+
113
|
228 |
+
oñeg̃uahẽ hag̃ua
|
229 |
+
114
|
230 |
+
mba'apo nañande'apo'íri
|
231 |
+
115
|
232 |
+
mateo houpaite che terere
|
233 |
+
116
|
234 |
+
oĩ ojejaʼovaʼekue oipurúre avañeʼẽ
|
235 |
+
117
|
236 |
+
avei ykaraipyre kurusumimi ha tataindy
|
237 |
+
118
|
238 |
+
karai ferreira ombosako'i irambosarã
|
239 |
+
119
|
240 |
+
añuã kakuaa ndéve
|
241 |
+
120
|
242 |
+
terehupyty vy'apavẽ
|
243 |
+
121
|
244 |
+
ombojeguapa ha ombohory ko ñane retã
|
245 |
+
122
|
246 |
+
che rohayhuháicha ndaipotái nde cherayhu
|
247 |
+
123
|
248 |
+
ñande ru taneñongatu ipópe
|
249 |
+
124
|
250 |
+
ka'arupytũvo omanóma katu
|
251 |
+
125
|
252 |
+
ko'ẽrõ areko peteĩ aranduchauka
|
253 |
+
126
|
254 |
+
he'i chéve amyengovia hag̃ua peteĩ tesapeha pyahúvare
|
255 |
+
127
|
256 |
+
chéngo aháta chupe pyharekue
|
257 |
+
128
|
258 |
+
hembiapo teete
|
259 |
+
129
|
260 |
+
¡irũnguéra
|
261 |
+
130
|
262 |
+
peteĩ ára og̃uahẽ mburika rysýi peteĩ oga'i peve
|
263 |
+
131
|
264 |
+
ko'ág̃a oĩháme villeta
|
265 |
+
132
|
266 |
+
upéi ñarambosáta ñande gustope
|
267 |
+
133
|
268 |
+
ag̃uahẽvo henondépe ajuhu iñipytũha
|
269 |
+
134
|
270 |
+
upépe katu iñarõvéntema hendive mitãkaria'ykuéra
|
271 |
+
135
|
272 |
+
peteĩ ára omanósapy'a upe karai rembireko
|
273 |
+
136
|
274 |
+
mbohapy ára haguépe ndaje
|
275 |
+
137
|
276 |
+
irundy mondaha ojapókuri hembiapo vai molaskue jerére
|
277 |
+
138
|
278 |
+
ama opororo yvytu reheve
|
279 |
+
139
|
280 |
+
ha beto'ípentevoi ojekuaave chupe
|
281 |
+
140
|
282 |
+
isy omanókuri ha'e heñoirõguare
|
283 |
+
141
|
284 |
+
peteĩ jey ña antonia vaka porã peteĩ iko'ẽ omano
|
285 |
+
142
|
286 |
+
nosẽivavoi upégui
|
287 |
+
143
|
288 |
+
ani re'uve pizza helen
|
289 |
+
144
|
290 |
+
ipa'ũme oĩ avei
|
291 |
+
145
|
292 |
+
josé okañy yvyra kupépe
|
293 |
+
146
|
294 |
+
imembykuéra katu omenda rehe ohopa hikuái
|
295 |
+
147
|
296 |
+
nde remaña cherehe
|
297 |
+
148
|
298 |
+
upéguintema ojeraháma chupe cuartelpe
|
299 |
+
149
|
300 |
+
ara vaíngo ha iñipytũñepyrũma
|
301 |
+
150
|
302 |
+
upe pyhare pukukue niko oky ha péicha jey iko'ẽ
|
303 |
+
151
|
304 |
+
taha'eha'éva peñembojakuaa che rajy rendápe
|
305 |
+
152
|
306 |
+
aiko porã
|
307 |
+
153
|
308 |
+
tetã sãmbyhýpe
|
309 |
+
154
|
310 |
+
mboýpa ovale
|
311 |
+
155
|
312 |
+
hesúniko tupã ra'y
|
313 |
+
156
|
314 |
+
taguato ruvicha niko pe hekoverosãvéva guyrakuéra hesegua apytépe
|
315 |
+
157
|
316 |
+
hetaitereirasa oheka hikuái ha mamove ndojuhúi mitã'i akãhatãme
|
317 |
+
158
|
318 |
+
ha ndoipotáigui ha'e omenda oipohãnoukava'ekue inocenciape
|
mozilla-foundation_common_voice_8_0_gn_test_eval_results.txt
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
WER: 0.6905487804878049
|
2 |
+
CER: 0.1470525187566988
|