Spaces:

evaluate-metric
/

google_bleu

Running

App Files Community

lvwerra HF Staff committed on Sep 22, 2022

Commit

b6b5d94

1 Parent(s): 821f592

Update Space (evaluate main: c447fc8e)

Browse files

Files changed (2) hide show

google_bleu.py +11 -28
requirements.txt +1 -1

google_bleu.py CHANGED Viewed

@@ -13,8 +13,7 @@
 # limitations under the License.
 """ Google BLEU (aka GLEU) metric. """
-from dataclasses import dataclass
-from typing import Callable, Dict, List, Optional
 import datasets
 from nltk.translate import gleu_score
@@ -125,28 +124,13 @@ Examples:
 """
-@dataclass
-class GoogleBleuConfig(evaluate.info.Config):
-    name: str = "default"
-    tokenizer: Optional[Callable] = None
-    min_len: int = 1
-    max_len: int = 4
 @evaluate.utils.file_utils.add_start_docstrings(_DESCRIPTION, _KWARGS_DESCRIPTION)
 class GoogleBleu(evaluate.Metric):
-    CONFIG_CLASS = GoogleBleuConfig
-    ALLOWED_CONFIG_NAMES = ["default"]
-    def _info(self, config) -> MetricInfo:
         return evaluate.MetricInfo(
             description=_DESCRIPTION,
             citation=_CITATION,
             inputs_description=_KWARGS_DESCRIPTION,
-            config=config,
             features=[
                 datasets.Features(
                     {
@@ -163,12 +147,14 @@ class GoogleBleu(evaluate.Metric):
             ],
         )
-    def _compute(self, predictions, references):
-        if self.config.tokenizer is None:
-            tokenizer = Tokenizer13a()
-        else:
-            tokenizer = self.config.tokenizer
         # if only one reference is provided make sure we still use list of lists
         if isinstance(references[0], str):
             references = [[ref] for ref in references]
@@ -177,9 +163,6 @@ class GoogleBleu(evaluate.Metric):
         predictions = [tokenizer(p) for p in predictions]
         return {
             "google_bleu": gleu_score.corpus_gleu(
-                list_of_references=references,
-                hypotheses=predictions,
-                min_len=self.config.min_len,
-                max_len=self.config.max_len,
             )
         }

 # limitations under the License.
 """ Google BLEU (aka GLEU) metric. """
+from typing import Dict, List
 import datasets
 from nltk.translate import gleu_score
 """
 @evaluate.utils.file_utils.add_start_docstrings(_DESCRIPTION, _KWARGS_DESCRIPTION)
 class GoogleBleu(evaluate.Metric):
+    def _info(self) -> MetricInfo:
         return evaluate.MetricInfo(
             description=_DESCRIPTION,
             citation=_CITATION,
             inputs_description=_KWARGS_DESCRIPTION,
             features=[
                 datasets.Features(
                     {
             ],
         )
+    def _compute(
+        self,
+        predictions: List[str],
+        references: List[List[str]],
+        tokenizer=Tokenizer13a(),
+        min_len: int = 1,
+        max_len: int = 4,
+    ) -> Dict[str, float]:
         # if only one reference is provided make sure we still use list of lists
         if isinstance(references[0], str):
             references = [[ref] for ref in references]
         predictions = [tokenizer(p) for p in predictions]
         return {
             "google_bleu": gleu_score.corpus_gleu(
+                list_of_references=references, hypotheses=predictions, min_len=min_len, max_len=max_len
             )
         }

requirements.txt CHANGED Viewed

	@@ -1,2 +1,2 @@
1	- git+https://github.com/huggingface/evaluate@e4a2724377909fe2aeb4357e3971e5a569673b39
2	nltk


1	+ git+https://github.com/huggingface/evaluate@c447fc8eda9c62af501bfdc6988919571050d950
2	nltk