Spaces:

fnvls
/

bleu_1234

Runtime error

App Files Files Community

fnvls committed on Nov 16, 2023

Commit

8bc4fde

1 Parent(s): cdd89cc

add bleu 1 2 3 4 compute

Browse files

Files changed (2) hide show

README.md +2 -2
bleu_1234.py +32 -9

README.md CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 title: bleu_1234
-datasets:
--
 tags:
 - evaluate
 - metric

 ---
 title: bleu_1234
+datasets:
+- "none"
 tags:
 - evaluate
 - metric

bleu_1234.py CHANGED Viewed

@@ -70,10 +70,20 @@ class bleu_1234(evaluate.Metric):
             citation=_CITATION,
             inputs_description=_KWARGS_DESCRIPTION,
             # This defines the format of each prediction and reference
-            features=datasets.Features({
-                'predictions': datasets.Value('int64'),
-                'references': datasets.Value('int64'),
-            }),
             # Homepage of the module for documentation
             homepage="http://module.homepage",
             # Additional links to the codebase or references
@@ -84,12 +94,25 @@ class bleu_1234(evaluate.Metric):
     def _download_and_prepare(self, dl_manager):
         """Optional: download external resources useful to compute the scores"""
         # TODO: Download external resources if needed
-        pass
     def _compute(self, predictions, references):
         """Returns the scores"""
         # TODO: Compute the different scores of the module
-        accuracy = sum(i == j for i, j in zip(predictions, references)) / len(predictions)
-        return {
-            "accuracy": accuracy,
-        }

             citation=_CITATION,
             inputs_description=_KWARGS_DESCRIPTION,
             # This defines the format of each prediction and reference
+            features=[
+                datasets.Features(
+                    {
+                        "predictions": datasets.Value("string", id="sequence"),
+                        "references": datasets.Sequence(datasets.Value("string", id="sequence"), id="references"),
+                    }
+                ),
+                datasets.Features(
+                    {
+                        "predictions": datasets.Value("string", id="sequence"),
+                        "references": datasets.Value("string", id="sequence"),
+                    }
+                ),
+            ],
             # Homepage of the module for documentation
             homepage="http://module.homepage",
             # Additional links to the codebase or references
     def _download_and_prepare(self, dl_manager):
         """Optional: download external resources useful to compute the scores"""
         # TODO: Download external resources if needed
+        # Nothing is downloaded here. These imports only make a missing
+        # dependency fail early: names imported inside a function are local
+        # to that function, so `_compute` has to import BLEUScore itself.
+        import torch
+        from torchmetrics.text import BLEUScore
     def _compute(self, predictions, references):
         """Returns the scores"""
         # TODO: Compute the different scores of the module
+        # Imported locally because the import in `_download_and_prepare` does
+        # not bind BLEUScore in this method's scope.
+        from torchmetrics.text import BLEUScore
+
+        # Accept either one reference string per prediction or a list of
+        # reference strings per prediction; BLEUScore expects the nested form.
+        # The emptiness guard avoids an IndexError on `references[0]`.
+        if references and isinstance(references[0], str):
+            references = [[ref] for ref in references]
+        output_dict = {}
+        for n_gram in range(1, 5):
+            # The n-gram order is a constructor argument of BLEUScore; the
+            # metric call itself only takes the predictions and the targets.
+            bleu = BLEUScore(n_gram=n_gram)
+            # .item() converts the scalar tensor into a plain Python float.
+            output_dict[f"bleu-{n_gram}"] = bleu(predictions, references).item()
+        return output_dict