zbeloki committed on
Commit
f4def17
1 Parent(s): f64e188

Initial version of M2 implemented

Browse files
Files changed (2) hide show
  1. m2.py +49 -7
  2. requirements.txt +2 -1
m2.py CHANGED
@@ -14,8 +14,10 @@
14
  """TODO: Add a description here."""
15
 
16
  import evaluate
17
- import datasets
 
18
 
 
19
 
20
  # TODO: Add BibTeX citation
21
  _CITATION = """\
@@ -70,9 +72,17 @@ class M2(evaluate.Metric):
70
  citation=_CITATION,
71
  inputs_description=_KWARGS_DESCRIPTION,
72
  # This defines the format of each prediction and reference
73
- features=datasets.Features({
74
- 'predictions': datasets.Value('int64'),
75
- 'references': datasets.Value('int64'),
 
 
 
 
 
 
 
 
76
  }),
77
  # Homepage of the module for documentation
78
  homepage="http://module.homepage",
@@ -88,8 +98,40 @@ class M2(evaluate.Metric):
88
 
89
  def _compute(self, predictions, references):
90
  """Returns the scores"""
 
91
  # TODO: Compute the different scores of the module
92
- accuracy = sum(i == j for i, j in zip(predictions, references)) / len(predictions)
93
  return {
94
- "accuracy": accuracy,
95
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
14
  """TODO: Add a description here."""
15
 
16
  import evaluate
17
+ from datasets import Features, Sequence, Value
18
+ import pdb
19
 
20
+ from m2scorer import get_m2score, get_m2score_from_raw, load_m2
21
 
22
  # TODO: Add BibTeX citation
23
  _CITATION = """\
 
72
  citation=_CITATION,
73
  inputs_description=_KWARGS_DESCRIPTION,
74
  # This defines the format of each prediction and reference
75
+ features=Features({
76
+ 'predictions': Value(dtype='string'),
77
+ 'references': {
78
+ 'source_sentence': Value(dtype='string'),
79
+ 'edits': Sequence({
80
+ 'from': Value(dtype='int32'),
81
+ 'to': Value(dtype='int32'),
82
+ 'text': [Value(dtype='string')],
83
+ 'aid': Value(dtype='int32'),
84
+ }),
85
+ },
86
  }),
87
  # Homepage of the module for documentation
88
  homepage="http://module.homepage",
 
98
 
99
  def _compute(self, predictions, references):
100
  """Returns the scores"""
101
+ gold_data = self._features_to_gold_data(references)
102
  # TODO: Compute the different scores of the module
103
+ p, r, f = get_m2score(predictions, gold_data, tokenize=False, keep_gold=True)
104
  return {
105
+ "f0.5": f,
106
+ "precision": p,
107
+ "recall": r,
108
+ }
109
+
110
+ def _features_to_gold_data(self, features):
111
+ gold_data = []
112
+ for entry in features:
113
+ annotators = {}
114
+ edits = entry['edits']
115
+ for i in range(len(edits['from'])):
116
+ edit = (edits['from'][i], edits['to'][i], edits['text'][i])
117
+ if edits['aid'][i] not in annotators:
118
+ annotators[edits['aid'][i]] = []
119
+ annotators[edits['aid'][i]].append(edit)
120
+ gold_data.append( (entry['source_sentence'], annotators) )
121
+ return gold_data
122
+
123
+ def load_m2_file(self, fpath):
124
+ data = load_m2(fpath)
125
+ result = []
126
+ for src_sent, edits_ in data:
127
+ edits = []
128
+ for aid, annotator_edits in edits_.items():
129
+ if len(annotator_edits) == 0:
130
+ edits.append({'from': -1, 'to': -1, 'text': [''], 'aid': aid})
131
+ for from_, to_, text_ in annotator_edits:
132
+ edits.append({'from': from_, 'to': to_, 'text': text_, 'aid': aid})
133
+ result.append({
134
+ 'source_sentence': src_sent,
135
+ 'edits': edits,
136
+ })
137
+ return result
requirements.txt CHANGED
@@ -1 +1,2 @@
1
- git+https://github.com/huggingface/evaluate@main
 
 
1
+ git+https://github.com/huggingface/evaluate@main
2
+ git+https://github.com/zbeloki/m2scorer@master