gonglinyuan
/

metro_t0pp_largepp

@@ -16,7 +16,7 @@ model-index:
       split: validation
     metrics:
       - type: accuracy
-        value: 8
   - task:
       type: natural-language-inference
     dataset:
@@ -26,7 +26,7 @@ model-index:
       split: validation
     metrics:
       - type: accuracy
-        value: 3
   - task:
       type: natural-language-inference
     dataset:
@@ -35,7 +35,7 @@ model-index:
       split: dev_r1
     metrics:
       - type: accuracy
-        value: .
   - task:
       type: natural-language-inference
     dataset:
@@ -44,7 +44,7 @@ model-index:
       split: dev_r2
     metrics:
       - type: accuracy
-        value: 6
   - task:
       type: natural-language-inference
     dataset:
@@ -53,7 +53,7 @@ model-index:
       split: dev_r3
     metrics:
       - type: accuracy
-        value: 8
   - task:
       type: coreference-resolution
     dataset:
@@ -63,7 +63,7 @@ model-index:
       split: validation
     metrics:
       - type: accuracy
-        value: 2
   - task:
       type: coreference-resolution
     dataset:
@@ -73,7 +73,7 @@ model-index:
       split: validation
     metrics:
       - type: accuracy
-        value: 3
   - task:
       type: multiple-choice-qa
     dataset:
@@ -83,7 +83,7 @@ model-index:
       split: validation
     metrics:
       - type: accuracy
-        value: 1
   - task:
       type: multiple-choice-qa
     dataset:
@@ -93,7 +93,7 @@ model-index:
       split: validation
     metrics:
       - type: accuracy
-        value: 0
   - task:
       type: multiple-choice-qa
     dataset:
@@ -102,7 +102,7 @@ model-index:
       split: validation
     metrics:
       - type: accuracy
-        value: 4
   - task:
       type: word-sense-disambiguation
     dataset:
@@ -112,7 +112,7 @@ model-index:
       split: validation
     metrics:
       - type: accuracy
-        value: 6
 ---
 Official repository: https://github.com/gonglinyuan/metro_t0

       split: validation
     metrics:
       - type: accuracy
+        value: 83.68231046931406
   - task:
       type: natural-language-inference
     dataset:
       split: validation
     metrics:
       - type: accuracy
+        value: 74.8809523809524
   - task:
       type: natural-language-inference
     dataset:
       split: dev_r1
     metrics:
       - type: accuracy
+        value: 46.84
   - task:
       type: natural-language-inference
     dataset:
       split: dev_r2
     metrics:
       - type: accuracy
+        value: 40.373333333333335
   - task:
       type: natural-language-inference
     dataset:
       split: dev_r3
     metrics:
       - type: accuracy
+        value: 44.949999999999996
   - task:
       type: coreference-resolution
     dataset:
       split: validation
     metrics:
       - type: accuracy
+        value: 71.82692307692307
   - task:
       type: coreference-resolution
     dataset:
       split: validation
     metrics:
       - type: accuracy
+        value: 62.74664561957379
   - task:
       type: multiple-choice-qa
     dataset:
       split: validation
     metrics:
       - type: accuracy
+        value: 92.625
   - task:
       type: multiple-choice-qa
     dataset:
       split: validation
     metrics:
       - type: accuracy
+        value: 95.64938535542491
   - task:
       type: multiple-choice-qa
     dataset:
       split: validation
     metrics:
       - type: accuracy
+        value: 83.74327823142801
   - task:
       type: word-sense-disambiguation
     dataset:
       split: validation
     metrics:
       - type: accuracy
+        value: 70.4858934169279
 ---
 Official repository: https://github.com/gonglinyuan/metro_t0