Spaces:

evaluate-metric
/

xtreme_s

Running

App Files Community

lvwerra HF staff committed on Sep 22, 2022

Commit

9b085fb

1 Parent(s): 5929372

Update Space (evaluate main: e4a27243)

Browse files

Files changed (2) hide show

requirements.txt +1 -1
xtreme_s.py +20 -7

requirements.txt CHANGED Viewed

	@@ -1,2 +1,2 @@
1	- git+https://github.com/huggingface/evaluate@80448674f5447a9682afe051db243c4a13bfe4ff
2	sklearn


1	+ git+https://github.com/huggingface/evaluate@e4a2724377909fe2aeb4357e3971e5a569673b39
2	sklearn

xtreme_s.py CHANGED Viewed

@@ -13,7 +13,8 @@
 # limitations under the License.
 """ XTREME-S benchmark metric. """
-from typing import List
 import datasets
 from datasets.config import PY_VERSION
@@ -218,11 +219,22 @@ def wer_and_cer(preds, labels, concatenate_texts, config_name):
         return {"wer": compute_score(preds, labels, "wer"), "cer": compute_score(preds, labels, "cer")}
 @evaluate.utils.file_utils.add_start_docstrings(_DESCRIPTION, _KWARGS_DESCRIPTION)
 class XtremeS(evaluate.Metric):
-    def _info(self):
-        if self.config_name not in _CONFIG_NAMES:
-            raise KeyError(f"You should supply a configuration name selected in {_CONFIG_NAMES}")
         pred_type = "int64" if self.config_name in ["fleurs-lang_id", "minds14"] else "string"
@@ -230,6 +242,7 @@ class XtremeS(evaluate.Metric):
             description=_DESCRIPTION,
             citation=_CITATION,
             inputs_description=_KWARGS_DESCRIPTION,
             features=datasets.Features(
                 {"predictions": datasets.Value(pred_type), "references": datasets.Value(pred_type)}
             ),
@@ -238,10 +251,10 @@ class XtremeS(evaluate.Metric):
             format="numpy",
         )
-    def _compute(self, predictions, references, bleu_kwargs=None, wer_kwargs=None):
-        bleu_kwargs = bleu_kwargs if bleu_kwargs is not None else {}
-        wer_kwargs = wer_kwargs if wer_kwargs is not None else {}
         if self.config_name == "fleurs-lang_id":
             return {"accuracy": simple_accuracy(predictions, references)}

 # limitations under the License.
 """ XTREME-S benchmark metric. """
+from dataclasses import dataclass
+from typing import List, Optional
 import datasets
 from datasets.config import PY_VERSION
         return {"wer": compute_score(preds, labels, "wer"), "cer": compute_score(preds, labels, "cer")}
+@dataclass
+class XtremeSConfig(evaluate.info.Config):
+    name: str = "default"
+    bleu_kwargs: Optional[dict] = None
+    wer_kwargs: Optional[dict] = None
 @evaluate.utils.file_utils.add_start_docstrings(_DESCRIPTION, _KWARGS_DESCRIPTION)
 class XtremeS(evaluate.Metric):
+    CONFIG_CLASS = XtremeSConfig
+    ALLOWED_CONFIG_NAMES = _CONFIG_NAMES
+    def _info(self, config):
         pred_type = "int64" if self.config_name in ["fleurs-lang_id", "minds14"] else "string"
             description=_DESCRIPTION,
             citation=_CITATION,
             inputs_description=_KWARGS_DESCRIPTION,
+            config=config,
             features=datasets.Features(
                 {"predictions": datasets.Value(pred_type), "references": datasets.Value(pred_type)}
             ),
             format="numpy",
         )
+    def _compute(self, predictions, references):
+        bleu_kwargs = self.config.bleu_kwargs if self.config.bleu_kwargs is not None else {}
+        wer_kwargs = self.config.wer_kwargs if self.config.wer_kwargs is not None else {}
         if self.config_name == "fleurs-lang_id":
             return {"accuracy": simple_accuracy(predictions, references)}