Commit
·
4a5ca58
1
Parent(s):
f8adc06
Update README.md
Browse files
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
split: validation
|
17 |
metrics:
|
18 |
- type: accuracy
|
19 |
-
value:
|
20 |
- task:
|
21 |
type: natural-language-inference
|
22 |
dataset:
|
@@ -26,7 +26,7 @@ model-index:
|
|
26 |
split: validation
|
27 |
metrics:
|
28 |
- type: accuracy
|
29 |
-
value:
|
30 |
- task:
|
31 |
type: natural-language-inference
|
32 |
dataset:
|
@@ -35,7 +35,7 @@ model-index:
|
|
35 |
split: dev_r1
|
36 |
metrics:
|
37 |
- type: accuracy
|
38 |
-
value: .
|
39 |
- task:
|
40 |
type: natural-language-inference
|
41 |
dataset:
|
@@ -44,7 +44,7 @@ model-index:
|
|
44 |
split: dev_r2
|
45 |
metrics:
|
46 |
- type: accuracy
|
47 |
-
value:
|
48 |
- task:
|
49 |
type: natural-language-inference
|
50 |
dataset:
|
@@ -53,7 +53,7 @@ model-index:
|
|
53 |
split: dev_r3
|
54 |
metrics:
|
55 |
- type: accuracy
|
56 |
-
value:
|
57 |
- task:
|
58 |
type: coreference-resolution
|
59 |
dataset:
|
@@ -63,7 +63,7 @@ model-index:
|
|
63 |
split: validation
|
64 |
metrics:
|
65 |
- type: accuracy
|
66 |
-
value:
|
67 |
- task:
|
68 |
type: coreference-resolution
|
69 |
dataset:
|
@@ -73,7 +73,7 @@ model-index:
|
|
73 |
split: validation
|
74 |
metrics:
|
75 |
- type: accuracy
|
76 |
-
value:
|
77 |
- task:
|
78 |
type: multiple-choice-qa
|
79 |
dataset:
|
@@ -83,7 +83,7 @@ model-index:
|
|
83 |
split: validation
|
84 |
metrics:
|
85 |
- type: accuracy
|
86 |
-
value:
|
87 |
- task:
|
88 |
type: multiple-choice-qa
|
89 |
dataset:
|
@@ -93,7 +93,7 @@ model-index:
|
|
93 |
split: validation
|
94 |
metrics:
|
95 |
- type: accuracy
|
96 |
-
value:
|
97 |
- task:
|
98 |
type: multiple-choice-qa
|
99 |
dataset:
|
@@ -102,7 +102,7 @@ model-index:
|
|
102 |
split: validation
|
103 |
metrics:
|
104 |
- type: accuracy
|
105 |
-
value:
|
106 |
- task:
|
107 |
type: word-sense-disambiguation
|
108 |
dataset:
|
@@ -112,7 +112,7 @@ model-index:
|
|
112 |
split: validation
|
113 |
metrics:
|
114 |
- type: accuracy
|
115 |
-
value:
|
116 |
---
|
117 |
|
118 |
Official repository: https://github.com/gonglinyuan/metro_t0
|
|
|
16 |
split: validation
|
17 |
metrics:
|
18 |
- type: accuracy
|
19 |
+
value: 83.68231046931406
|
20 |
- task:
|
21 |
type: natural-language-inference
|
22 |
dataset:
|
|
|
26 |
split: validation
|
27 |
metrics:
|
28 |
- type: accuracy
|
29 |
+
value: 74.8809523809524
|
30 |
- task:
|
31 |
type: natural-language-inference
|
32 |
dataset:
|
|
|
35 |
split: dev_r1
|
36 |
metrics:
|
37 |
- type: accuracy
|
38 |
+
value: 46.84
|
39 |
- task:
|
40 |
type: natural-language-inference
|
41 |
dataset:
|
|
|
44 |
split: dev_r2
|
45 |
metrics:
|
46 |
- type: accuracy
|
47 |
+
value: 40.373333333333335
|
48 |
- task:
|
49 |
type: natural-language-inference
|
50 |
dataset:
|
|
|
53 |
split: dev_r3
|
54 |
metrics:
|
55 |
- type: accuracy
|
56 |
+
value: 44.949999999999996
|
57 |
- task:
|
58 |
type: coreference-resolution
|
59 |
dataset:
|
|
|
63 |
split: validation
|
64 |
metrics:
|
65 |
- type: accuracy
|
66 |
+
value: 71.82692307692307
|
67 |
- task:
|
68 |
type: coreference-resolution
|
69 |
dataset:
|
|
|
73 |
split: validation
|
74 |
metrics:
|
75 |
- type: accuracy
|
76 |
+
value: 62.74664561957379
|
77 |
- task:
|
78 |
type: multiple-choice-qa
|
79 |
dataset:
|
|
|
83 |
split: validation
|
84 |
metrics:
|
85 |
- type: accuracy
|
86 |
+
value: 92.625
|
87 |
- task:
|
88 |
type: multiple-choice-qa
|
89 |
dataset:
|
|
|
93 |
split: validation
|
94 |
metrics:
|
95 |
- type: accuracy
|
96 |
+
value: 95.64938535542491
|
97 |
- task:
|
98 |
type: multiple-choice-qa
|
99 |
dataset:
|
|
|
102 |
split: validation
|
103 |
metrics:
|
104 |
- type: accuracy
|
105 |
+
value: 83.74327823142801
|
106 |
- task:
|
107 |
type: word-sense-disambiguation
|
108 |
dataset:
|
|
|
112 |
split: validation
|
113 |
metrics:
|
114 |
- type: accuracy
|
115 |
+
value: 70.4858934169279
|
116 |
---
|
117 |
|
118 |
Official repository: https://github.com/gonglinyuan/metro_t0
|