sjrhuschlee
committed on
Commit
•
a8eb9ab
1
Parent(s):
a99591c
Update README.md
Browse files
README.md
CHANGED
@@ -27,10 +27,10 @@ model-index:
|
|
27 |
split: validation
|
28 |
metrics:
|
29 |
- type: exact_match
|
30 |
-
value: 86.
|
31 |
name: Exact Match
|
32 |
- type: f1
|
33 |
-
value: 89.
|
34 |
name: F1
|
35 |
- task:
|
36 |
type: question-answering
|
@@ -42,10 +42,10 @@ model-index:
|
|
42 |
split: validation
|
43 |
metrics:
|
44 |
- type: exact_match
|
45 |
-
value:
|
46 |
name: Exact Match
|
47 |
- type: f1
|
48 |
-
value:
|
49 |
name: F1
|
50 |
- task:
|
51 |
type: question-answering
|
@@ -57,10 +57,10 @@ model-index:
|
|
57 |
split: validation
|
58 |
metrics:
|
59 |
- type: exact_match
|
60 |
-
value:
|
61 |
name: Exact Match
|
62 |
- type: f1
|
63 |
-
value:
|
64 |
name: F1
|
65 |
- task:
|
66 |
type: question-answering
|
@@ -72,10 +72,10 @@ model-index:
|
|
72 |
split: validation
|
73 |
metrics:
|
74 |
- type: exact_match
|
75 |
-
value:
|
76 |
name: Exact Match
|
77 |
- type: f1
|
78 |
-
value:
|
79 |
name: F1
|
80 |
- task:
|
81 |
type: question-answering
|
@@ -87,55 +87,55 @@ model-index:
|
|
87 |
split: test
|
88 |
metrics:
|
89 |
- type: exact_match
|
90 |
-
value:
|
91 |
name: Exact Match
|
92 |
- type: f1
|
93 |
-
value:
|
94 |
name: F1
|
95 |
- task:
|
96 |
type: question-answering
|
97 |
name: Question Answering
|
98 |
dataset:
|
99 |
-
name: squadshifts
|
100 |
type: squadshifts
|
101 |
config: new_wiki
|
102 |
split: test
|
103 |
metrics:
|
104 |
- type: exact_match
|
105 |
-
value:
|
106 |
name: Exact Match
|
107 |
- type: f1
|
108 |
-
value:
|
109 |
name: F1
|
110 |
- task:
|
111 |
type: question-answering
|
112 |
name: Question Answering
|
113 |
dataset:
|
114 |
-
name: squadshifts
|
115 |
type: squadshifts
|
116 |
config: nyt
|
117 |
split: test
|
118 |
metrics:
|
119 |
- type: exact_match
|
120 |
-
value:
|
121 |
name: Exact Match
|
122 |
- type: f1
|
123 |
-
value:
|
124 |
name: F1
|
125 |
- task:
|
126 |
type: question-answering
|
127 |
name: Question Answering
|
128 |
dataset:
|
129 |
-
name: squadshifts
|
130 |
type: squadshifts
|
131 |
config: reddit
|
132 |
split: test
|
133 |
metrics:
|
134 |
- type: exact_match
|
135 |
-
value:
|
136 |
name: Exact Match
|
137 |
- type: f1
|
138 |
-
value:
|
139 |
name: F1
|
140 |
---
|
141 |
|
|
|
27 |
split: validation
|
28 |
metrics:
|
29 |
- type: exact_match
|
30 |
+
value: 86.819
|
31 |
name: Exact Match
|
32 |
- type: f1
|
33 |
+
value: 89.569
|
34 |
name: F1
|
35 |
- task:
|
36 |
type: question-answering
|
|
|
42 |
split: validation
|
43 |
metrics:
|
44 |
- type: exact_match
|
45 |
+
value: 89.357
|
46 |
name: Exact Match
|
47 |
- type: f1
|
48 |
+
value: 95.060
|
49 |
name: F1
|
50 |
- task:
|
51 |
type: question-answering
|
|
|
57 |
split: validation
|
58 |
metrics:
|
59 |
- type: exact_match
|
60 |
+
value: 48.833
|
61 |
name: Exact Match
|
62 |
- type: f1
|
63 |
+
value: 62.555
|
64 |
name: F1
|
65 |
- task:
|
66 |
type: question-answering
|
|
|
72 |
split: validation
|
73 |
metrics:
|
74 |
- type: exact_match
|
75 |
+
value: 84.835
|
76 |
name: Exact Match
|
77 |
- type: f1
|
78 |
+
value: 90.245
|
79 |
name: F1
|
80 |
- task:
|
81 |
type: question-answering
|
|
|
87 |
split: test
|
88 |
metrics:
|
89 |
- type: exact_match
|
90 |
+
value: 76.722
|
91 |
name: Exact Match
|
92 |
- type: f1
|
93 |
+
value: 89.680
|
94 |
name: F1
|
95 |
- task:
|
96 |
type: question-answering
|
97 |
name: Question Answering
|
98 |
dataset:
|
99 |
+
name: squadshifts new_wiki
|
100 |
type: squadshifts
|
101 |
config: new_wiki
|
102 |
split: test
|
103 |
metrics:
|
104 |
- type: exact_match
|
105 |
+
value: 84.316
|
106 |
name: Exact Match
|
107 |
- type: f1
|
108 |
+
value: 92.967
|
109 |
name: F1
|
110 |
- task:
|
111 |
type: question-answering
|
112 |
name: Question Answering
|
113 |
dataset:
|
114 |
+
name: squadshifts nyt
|
115 |
type: squadshifts
|
116 |
config: nyt
|
117 |
split: test
|
118 |
metrics:
|
119 |
- type: exact_match
|
120 |
+
value: 86.925
|
121 |
name: Exact Match
|
122 |
- type: f1
|
123 |
+
value: 94.064
|
124 |
name: F1
|
125 |
- task:
|
126 |
type: question-answering
|
127 |
name: Question Answering
|
128 |
dataset:
|
129 |
+
name: squadshifts reddit
|
130 |
type: squadshifts
|
131 |
config: reddit
|
132 |
split: test
|
133 |
metrics:
|
134 |
- type: exact_match
|
135 |
+
value: 78.241
|
136 |
name: Exact Match
|
137 |
- type: f1
|
138 |
+
value: 89.243
|
139 |
name: F1
|
140 |
---
|
141 |
|