Add verifyToken field to verify evaluation results are produced by Hugging Face's automatic model evaluator
#7
by
autoevaluator
HF staff
- opened
README.md
CHANGED
@@ -5,12 +5,12 @@ license: mit
|
|
5 |
tags:
|
6 |
- text-classification
|
7 |
- zero-shot-classification
|
8 |
-
metrics:
|
9 |
-
- accuracy
|
10 |
datasets:
|
11 |
- multi_nli
|
12 |
- anli
|
13 |
- fever
|
|
|
|
|
14 |
pipeline_tag: zero-shot-classification
|
15 |
model-index:
|
16 |
- name: MoritzLaurer/DeBERTa-v3-base-mnli-fever-anli
|
@@ -24,50 +24,61 @@ model-index:
|
|
24 |
config: plain_text
|
25 |
split: test_r3
|
26 |
metrics:
|
27 |
-
-
|
28 |
-
type: accuracy
|
29 |
value: 0.495
|
|
|
30 |
verified: true
|
31 |
-
|
32 |
-
|
33 |
value: 0.4984740618243923
|
|
|
34 |
verified: true
|
35 |
-
|
36 |
-
|
37 |
value: 0.495
|
|
|
38 |
verified: true
|
39 |
-
|
40 |
-
|
41 |
value: 0.4984357572868885
|
|
|
42 |
verified: true
|
43 |
-
|
44 |
-
|
45 |
value: 0.49461028192371476
|
|
|
46 |
verified: true
|
47 |
-
|
48 |
-
|
49 |
value: 0.495
|
|
|
50 |
verified: true
|
51 |
-
|
52 |
-
|
53 |
value: 0.495
|
|
|
54 |
verified: true
|
55 |
-
|
56 |
-
|
57 |
value: 0.4942810999491704
|
|
|
58 |
verified: true
|
59 |
-
|
60 |
-
|
61 |
value: 0.495
|
|
|
62 |
verified: true
|
63 |
-
|
64 |
-
|
65 |
value: 0.4944671868893595
|
|
|
66 |
verified: true
|
67 |
-
|
68 |
-
|
69 |
value: 1.8788293600082397
|
|
|
70 |
verified: true
|
|
|
71 |
- task:
|
72 |
type: natural-language-inference
|
73 |
name: Natural Language Inference
|
@@ -77,50 +88,61 @@ model-index:
|
|
77 |
config: plain_text
|
78 |
split: test_r1
|
79 |
metrics:
|
80 |
-
-
|
81 |
-
type: accuracy
|
82 |
value: 0.712
|
|
|
83 |
verified: true
|
84 |
-
|
85 |
-
|
86 |
value: 0.7134839439315348
|
|
|
87 |
verified: true
|
88 |
-
|
89 |
-
|
90 |
value: 0.712
|
|
|
91 |
verified: true
|
92 |
-
|
93 |
-
|
94 |
value: 0.7134676028447461
|
|
|
95 |
verified: true
|
96 |
-
|
97 |
-
|
98 |
value: 0.7119814425203647
|
|
|
99 |
verified: true
|
100 |
-
|
101 |
-
|
102 |
value: 0.712
|
|
|
103 |
verified: true
|
104 |
-
|
105 |
-
|
106 |
value: 0.712
|
|
|
107 |
verified: true
|
108 |
-
|
109 |
-
|
110 |
value: 0.7119226991285647
|
|
|
111 |
verified: true
|
112 |
-
|
113 |
-
|
114 |
value: 0.712
|
|
|
115 |
verified: true
|
116 |
-
|
117 |
-
|
118 |
value: 0.7119242267218338
|
|
|
119 |
verified: true
|
120 |
-
|
121 |
-
|
122 |
value: 1.0105403661727905
|
|
|
123 |
verified: true
|
|
|
124 |
- task:
|
125 |
type: natural-language-inference
|
126 |
name: Natural Language Inference
|
@@ -130,50 +152,61 @@ model-index:
|
|
130 |
config: default
|
131 |
split: validation_mismatched
|
132 |
metrics:
|
133 |
-
-
|
134 |
-
type: accuracy
|
135 |
value: 0.902766476810415
|
|
|
136 |
verified: true
|
137 |
-
|
138 |
-
|
139 |
value: 0.9023816542652491
|
|
|
140 |
verified: true
|
141 |
-
|
142 |
-
|
143 |
value: 0.902766476810415
|
|
|
144 |
verified: true
|
145 |
-
|
146 |
-
|
147 |
value: 0.9034597464719761
|
|
|
148 |
verified: true
|
149 |
-
|
150 |
-
|
151 |
value: 0.9024304801555488
|
|
|
152 |
verified: true
|
153 |
-
|
154 |
-
|
155 |
value: 0.902766476810415
|
|
|
156 |
verified: true
|
157 |
-
|
158 |
-
|
159 |
value: 0.902766476810415
|
|
|
160 |
verified: true
|
161 |
-
|
162 |
-
|
163 |
value: 0.9023086094638595
|
|
|
164 |
verified: true
|
165 |
-
|
166 |
-
|
167 |
value: 0.902766476810415
|
|
|
168 |
verified: true
|
169 |
-
|
170 |
-
|
171 |
value: 0.9030161011457231
|
|
|
172 |
verified: true
|
173 |
-
|
174 |
-
|
175 |
value: 0.3283354640007019
|
|
|
176 |
verified: true
|
|
|
177 |
- task:
|
178 |
type: natural-language-inference
|
179 |
name: Natural Language Inference
|
@@ -183,50 +216,61 @@ model-index:
|
|
183 |
config: plain_text
|
184 |
split: dev_r1
|
185 |
metrics:
|
186 |
-
-
|
187 |
-
type: accuracy
|
188 |
value: 0.737
|
|
|
189 |
verified: true
|
190 |
-
|
191 |
-
|
192 |
value: 0.737681071614645
|
|
|
193 |
verified: true
|
194 |
-
|
195 |
-
|
196 |
value: 0.737
|
|
|
197 |
verified: true
|
198 |
-
|
199 |
-
|
200 |
value: 0.7376755842752241
|
|
|
201 |
verified: true
|
202 |
-
|
203 |
-
|
204 |
value: 0.7369675064285843
|
|
|
205 |
verified: true
|
206 |
-
|
207 |
-
|
208 |
value: 0.737
|
|
|
209 |
verified: true
|
210 |
-
|
211 |
-
|
212 |
value: 0.737
|
|
|
213 |
verified: true
|
214 |
-
|
215 |
-
|
216 |
value: 0.7366853496239583
|
|
|
217 |
verified: true
|
218 |
-
|
219 |
-
|
220 |
value: 0.737
|
|
|
221 |
verified: true
|
222 |
-
|
223 |
-
|
224 |
value: 0.7366990292378379
|
|
|
225 |
verified: true
|
226 |
-
|
227 |
-
|
228 |
value: 0.9349392056465149
|
|
|
229 |
verified: true
|
|
|
230 |
---
|
231 |
# DeBERTa-v3-base-mnli-fever-anli
|
232 |
## Model description
|
|
|
5 |
tags:
|
6 |
- text-classification
|
7 |
- zero-shot-classification
|
|
|
|
|
8 |
datasets:
|
9 |
- multi_nli
|
10 |
- anli
|
11 |
- fever
|
12 |
+
metrics:
|
13 |
+
- accuracy
|
14 |
pipeline_tag: zero-shot-classification
|
15 |
model-index:
|
16 |
- name: MoritzLaurer/DeBERTa-v3-base-mnli-fever-anli
|
|
|
24 |
config: plain_text
|
25 |
split: test_r3
|
26 |
metrics:
|
27 |
+
- type: accuracy
|
|
|
28 |
value: 0.495
|
29 |
+
name: Accuracy
|
30 |
verified: true
|
31 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYWViYjQ5YTZlYjU4NjQyN2NhOTVhNjFjNGQyMmFiNmQyZjRkOTdhNzJmNjc3NGU4MmY0MjYyMzY5MjZhYzE0YiIsInZlcnNpb24iOjF9.S8pIQ7gEGokd_wKXMi6Bc3B2DThIP3cvVkTFErZ-2JxXTSCy1TBuulY3dzGfaiP7kTHbL52OuBhG_-wb7Ue9DQ
|
32 |
+
- type: precision
|
33 |
value: 0.4984740618243923
|
34 |
+
name: Precision Macro
|
35 |
verified: true
|
36 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiOTllZDU3NmVmYjk4ZmYzNjAwNzExMGZjNDMzOWRkZjRjMTRhNzhlZmI0ZmNlM2E0Mzk4OWE5NTM5MTYyYWU5NCIsInZlcnNpb24iOjF9.WHz_TUJgPVn-rU-9vBCDdmSMOuWzADwr09rJY6ktqRM46zytbyWs7Vcm7jqDrTkfU-rp0_7IyoNv_xEsKhJbBA
|
37 |
+
- type: precision
|
38 |
value: 0.495
|
39 |
+
name: Precision Micro
|
40 |
verified: true
|
41 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZjllODE3ZjUxZDhiMTI0MzZmYjY5OTUwYWI2OTc4ZjJhNTVjMjY2ODdkMmJlZjQ5YWQ1Mjk2ZThmYjJlM2RlYSIsInZlcnNpb24iOjF9.a9V06-O7l9S0Bv4vj0aard8128SAP61DZdXl_3XqdmNgt_C6KAoDBVueF2M2kF_kT6lRfEz6YW0ACIfJNXDYAA
|
42 |
+
- type: precision
|
43 |
value: 0.4984357572868885
|
44 |
+
name: Precision Weighted
|
45 |
verified: true
|
46 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNjhiMzYzY2JiMmYwN2YxYzEwZTQ3NGI1NzFmMzliNjJkMDE2YzI5Njg1ZjEzMGIxODdiMDNmYmI4Y2Y2MmJkMiIsInZlcnNpb24iOjF9.xvZZaUMogw9MJjb3ls6h5liDlTqHMmNgqk6KbyDqQWfCcD255brCU3Xo6nECwaChS4te0dQu_iWGBqR_o2kYAA
|
47 |
+
- type: recall
|
48 |
value: 0.49461028192371476
|
49 |
+
name: Recall Macro
|
50 |
verified: true
|
51 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZDVjYTEzOTI0ZjVhOTk3ZTkzZmZhNTk5ODcxMWJhYWU4ZTRjYWVhNzcwOWY5YmI2NGFlYWE4NjM5MDY5NTExOSIsInZlcnNpb24iOjF9.xgHCB2rbCQBzHzUokw4u8JyOdhtF4yvPv1t8t7YiEkaAuM5MAPsVuCZ1VtlLapHS_IWetlocizsVl6akjh3cAQ
|
52 |
+
- type: recall
|
53 |
value: 0.495
|
54 |
+
name: Recall Micro
|
55 |
verified: true
|
56 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYTEyYmM0ZDQ0M2RiMDNhNjIxNzQ4OWZiNTBiOTAwZDFkNjNmYjBhNjA4NmQ0NjFkNmNiZTljNDkxNDg3NzIyYSIsInZlcnNpb24iOjF9.3FJPwNtwgFNvMjVxVAayaVXXR1sWlr0sqAYmXzmMzMxl7IJh6RS77dGPwFaqD3jamLVBiqPn9wsfz5lFK5yTAA
|
57 |
+
- type: recall
|
58 |
value: 0.495
|
59 |
+
name: Recall Weighted
|
60 |
verified: true
|
61 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNmY1MjZlZTQ4OTg5YzdlYmFhZDMzMmNlNjNkYmIyZGI4M2NjZjQ1ZDVkNmZkMTUxNjI3M2UwZmI1MDM1NDYwOSIsInZlcnNpb24iOjF9.cnbM6xjTLRa9z0wEDGd_Q4lTXVLRKIQ6_YLGLjf-t7Nto4lzxAeWF-RrwA0Mq9OPITlJq2Jk1Eg_0Utb13d9Dg
|
62 |
+
- type: f1
|
63 |
value: 0.4942810999491704
|
64 |
+
name: F1 Macro
|
65 |
verified: true
|
66 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiN2U3NGM1MDM4YTM4NzQxMGM4ZTIyZDM2YTQ1MGNlZWM1MzEzM2MxN2ZmZmRmYTM0OWJmZGJjYjM5OWEzMmZjNSIsInZlcnNpb24iOjF9.vMtge1F-tmMn9D3aVUuwcNEXjqpNgEyHAl9f5UDSoTYcOgTwi2vi5yRGRCl8y6Fx7BtgaCwMyoZVNbP5-GRtCA
|
67 |
+
- type: f1
|
68 |
value: 0.495
|
69 |
+
name: F1 Micro
|
70 |
verified: true
|
71 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNjBjMTQ5MmQ5OGE5OWJjZGMyNzg4N2RmNDUzMzQ5Zjc4ZTc4N2JlMTk0MTc2M2RjZTgzOTNlYWQzODAwNDI0NCIsInZlcnNpb24iOjF9.yxXG0CNWW8__xJC14BjbTY9QkXD75x6uCIXR51oKDemkP0b_xGyd-A2wPIuwNJN1EYkQevPY0bhVpRWBKyO9Bg
|
72 |
+
- type: f1
|
73 |
value: 0.4944671868893595
|
74 |
+
name: F1 Weighted
|
75 |
verified: true
|
76 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMzczNjQzY2FmMmY4NTAwYjNkYjJlN2I2NjI2Yjc0ZmQ3NjZiN2U5YWEwYjk4OTUyOTMzZTYyZjYzOTMzZGU2YiIsInZlcnNpb24iOjF9.mLOnst2ScPX7ZQwaUF12W2nv7-w9lX9-BxHl3-0T0gkSWnmtBSwYcL5faTX0_I5q33Fjz5tfkjpCJuxP5JYIBQ
|
77 |
+
- type: loss
|
78 |
value: 1.8788293600082397
|
79 |
+
name: loss
|
80 |
verified: true
|
81 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMzRlOTYwYjU1Y2Y4ZGM0NDBjYTE2MmEzNWIwN2NiMWVkOWZlNzA2ZmQ3YjZjNzI4MjQwYWZhODIwMzU3ODAyZiIsInZlcnNpb24iOjF9._Xs9bl48MSavvp5eyamrP2iNlFWv35QZCrmWjJXLkUdIBx0ElCjEdxBb3dxPGnUxdpDzGMmOoKCPI44ZPXrtDw
|
82 |
- task:
|
83 |
type: natural-language-inference
|
84 |
name: Natural Language Inference
|
|
|
88 |
config: plain_text
|
89 |
split: test_r1
|
90 |
metrics:
|
91 |
+
- type: accuracy
|
|
|
92 |
value: 0.712
|
93 |
+
name: Accuracy
|
94 |
verified: true
|
95 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYWYxMGY0ZWU0YTEyY2I3NmQwZmQ3YmFmNzQxNGU5OGNjN2ViN2I0ZjdkYWUzM2RmYzkzMDg3ZjVmNGYwNGZkZCIsInZlcnNpb24iOjF9.snWBusAeo1rrQqWk--vTxb-CBcFqM298YCtwTQGBZiFegKGSTSKzj-SM6HMNsmoQWmMuv7UfYPqYlnzEthOSAg
|
96 |
+
- type: precision
|
97 |
value: 0.7134839439315348
|
98 |
+
name: Precision Macro
|
99 |
verified: true
|
100 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNjMxMjg1Y2QwNzMwM2ZkNGM3ZTJhOGJmY2FkNGI1ZTFhOGQ3ODViNTJmZTYwMWJkZDYyYWRjMzFmZDI1NTM5YSIsInZlcnNpb24iOjF9.ZJnY6zYOBn-YEtN7uKzQ-VKXPwlIO1zq19Yuo37vBJNSs1dGDd8f1jgfdZuA19e_wA3Nc5nQKe9VXRwPHPgwAQ
|
101 |
+
- type: precision
|
102 |
value: 0.712
|
103 |
+
name: Precision Micro
|
104 |
verified: true
|
105 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZWM4YWQyODBlYTIwMWQxZDA1NmY1M2M2ODgwNDJiY2RhMDVhYTlkMDUzZTJkMThkYzRmNDg2YTdjMjczNGUwOCIsInZlcnNpb24iOjF9.SogsKHdbdlEs05IBYwXvlnaC_esg-DXAPc2KPRyHaVC5ItVHbxa63NpybSpao4baOoMlLG9aRe7TjG4gtB2dAQ
|
106 |
+
- type: precision
|
107 |
value: 0.7134676028447461
|
108 |
+
name: Precision Weighted
|
109 |
verified: true
|
110 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiODdjMzFkM2IwNWZiM2I4ZWViMmQ4NWM5MDY5ZWQxZjc1MGRmNjhmNzJhYWFmOWEwMjg3ZjhiZWM3YjlhOTIxNSIsInZlcnNpb24iOjF9._0JNIbiqLuDZrp_vrCljBe28xexZJPmigLyhkcO8AtH2VcNxWshwCpZuRF4bqvpMvnApJeuGMf3vXjCj0MC1Bw
|
111 |
+
- type: recall
|
112 |
value: 0.7119814425203647
|
113 |
+
name: Recall Macro
|
114 |
verified: true
|
115 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYjU4MWEyMzkyYzg1ZTIxMTc0M2NhMTgzOGEyZmY5OTg3M2Q1ZmMwNmU3ZmU1ZjA1MDk0OGZkMzM5NDVlZjBlNSIsInZlcnNpb24iOjF9.sZ3GTcmGGthpTLL7_Zovq8aBmE3Dp_PZi5v8ZI9yG9N6B_GjWvBuPC8ENXK1NwmwiHLsSvtKTG5JmAum-su0Dg
|
116 |
+
- type: recall
|
117 |
value: 0.712
|
118 |
+
name: Recall Micro
|
119 |
verified: true
|
120 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZDg3NGViZTlmMWM2ZDNhMzIzZGZkYWZhODQxNzg2MjNiNjQ0Zjg0NjQ1OWZkY2I5ODdiY2Y3Y2JjNzRmYjJkMiIsInZlcnNpb24iOjF9.bCZUzJamsozKWehnNph6E5coww5zZTrJdbWevWrSyfT0PyXc_wkZ-NKdyBAoqprBz3_8L3i5hPM6Qsy56b4BDA
|
121 |
+
- type: recall
|
122 |
value: 0.712
|
123 |
+
name: Recall Weighted
|
124 |
verified: true
|
125 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMDk1MDJiOGUzZThlZjJjMzY4NjMzODFiZjUzZmIwMjIxY2UwNzBiN2IxMWEwMGJjZTkxODA0YzUxZDE3ODRhOCIsInZlcnNpb24iOjF9.z0dqvB3aBVYt3xRIb_M4svWebfQc0QaDFVFzHnlA5QGEHkHOW3OecGhHE4EzBqTDI3DASWZTGMjrMDDt0uOMBw
|
126 |
+
- type: f1
|
127 |
value: 0.7119226991285647
|
128 |
+
name: F1 Macro
|
129 |
verified: true
|
130 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiM2U0YjMwNzhmOTEyNDZhODU3MTU0YTM4MmQ0NzEzNWI1YjY0ZWQ3MWRiMTdiNTUzNWRkZThjMWE4M2NkZmI0MiIsInZlcnNpb24iOjF9.hhj1BXkuWi9wXrCjT9NwqaPETtOoYNiyqYsJEw-ufA8A4hVThKA6ZBtma1Q_M65-DZFfPEBDBNASLZ7EPSbmDw
|
131 |
+
- type: f1
|
132 |
value: 0.712
|
133 |
+
name: F1 Micro
|
134 |
verified: true
|
135 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiODk0Y2EyMzc5M2ZlNWFlNDg2Zjc1OTQxNGY3YjA5YjUxYTYzZjRlZmU4ODYxNjA3ZjkxNGUzYjBmNmMxMzY5YiIsInZlcnNpb24iOjF9.DvKk-3hNh2LhN2ug5e0FgUntL3Ozdfl06Kz7jvmB-deOJH6INi2a2ZySXoEePoo8t2nR6ENFYu9QjMA2ojnpCA
|
136 |
+
- type: f1
|
137 |
value: 0.7119242267218338
|
138 |
+
name: F1 Weighted
|
139 |
verified: true
|
140 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiN2MxOWFlMmI2NGRiMjkwN2Q5MWZhNDFlYzQxNWNmNzQ3OWYxZThmNDU2OWU1MTE5OGY2MWRlYWUyNDM3OTkzZCIsInZlcnNpb24iOjF9.QrTD1gE8_wRok9u59W-Mx0cX89K-h2Ad6qa8J5rmP8lc_rkG0ft2n5_GqH1CBZBJwMFYv91Pn6TuE3eGxJuUDA
|
141 |
+
- type: loss
|
142 |
value: 1.0105403661727905
|
143 |
+
name: loss
|
144 |
verified: true
|
145 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMmUwMTg4NjM3ZTBiZTIyODcyNDNmNTE5ZDZhMzNkMDMyNjcwOGQ5NmY0NTlhMjgyNmIzZjRiNDFiNjA3M2RkZSIsInZlcnNpb24iOjF9.sjBDVJV-jnygwcppmByAXpoo-Wzz178bBzozJEuYEiJaHSbk_xEevfJS1PmLUuplYslKb1iyEctnjI-5bl-XDw
|
146 |
- task:
|
147 |
type: natural-language-inference
|
148 |
name: Natural Language Inference
|
|
|
152 |
config: default
|
153 |
split: validation_mismatched
|
154 |
metrics:
|
155 |
+
- type: accuracy
|
|
|
156 |
value: 0.902766476810415
|
157 |
+
name: Accuracy
|
158 |
verified: true
|
159 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMjExZWM3YzA3ZDNlNjEwMmViNWEwZTE3MjJjNjEyNDhjOTQxNGFmMzBjZTk0ODUwYTc2OGNiZjYyMTBmNWZjZSIsInZlcnNpb24iOjF9.zbFAGrv2flpmweqS7Poxib7qHFLdW8eUTzshdOm2B9H-KWpIZCWC-P4p8TLMdNJnUcZJZ03Okil4qjIMqqIRCA
|
160 |
+
- type: precision
|
161 |
value: 0.9023816542652491
|
162 |
+
name: Precision Macro
|
163 |
verified: true
|
164 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiN2U2MGViNmJjNWQxNzRjOTkxNDIxZjZjNmM5YzE4ZjU5NTE5NjFlNmEzZWRlOGYxN2E3NTAwMTEwYjNhNzE0YSIsInZlcnNpb24iOjF9.WJjDJf56FROvf7Y5ShWnnxMvK_ZpQ2PibAOtSFhSiYJ7bt4TGOzMwaZ5RSTf_mcfXgRfWbXmy1jCwNhDb-5EAw
|
165 |
+
- type: precision
|
166 |
value: 0.902766476810415
|
167 |
+
name: Precision Micro
|
168 |
verified: true
|
169 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYzRhZTExOTc5NDczZjI1YmMzOGYyOTU2MDU1OGE5ZTczMDE0MmU0NzZhY2YzMDI1ZGQ3MGM5MmJiODFkNzUzZiIsInZlcnNpb24iOjF9.aRYcGEI1Y8-a0d8XOoXhBgsFyj9LWNwEjoIPc594y7kJn91wXIsXoR0-_0iy3uz41mWaTTlwJx7lI-kipFDvDQ
|
170 |
+
- type: precision
|
171 |
value: 0.9034597464719761
|
172 |
+
name: Precision Weighted
|
173 |
verified: true
|
174 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMWQyMTZiZDA2OTUwZjRmNTFiMWRlZTNmOTliZmI2MWFmMjdjYzEyYTgwNzkyOTQzOTBmNTUyYjMwNTUxMTFkNiIsInZlcnNpb24iOjF9.hUtAMTl0THHUkaLcgk1Vy9IhjqJAXCJ_5STJ5A7k7s_SO9DHp3b6qusgwPmcGLYyPy1-j1dB2AIstxK4tHfmDA
|
175 |
+
- type: recall
|
176 |
value: 0.9024304801555488
|
177 |
+
name: Recall Macro
|
178 |
verified: true
|
179 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMzAxZGJhNGI3ZDNlMjg2ZDIxNTgwMDY5MTFjM2ExZmIxMDBmZjUyNTliNWNkOGI0OTY3NTYyNWU3OWFlYTA3YiIsInZlcnNpb24iOjF9.1o_GNq8zmXa_50MUF_K63IDc2aUKNeUkNQ5fT592-SAo8WgiaP9Dh6bOEu2OqrpRQ57P4qm7OdJt7UKsrosMDA
|
180 |
+
- type: recall
|
181 |
value: 0.902766476810415
|
182 |
+
name: Recall Micro
|
183 |
verified: true
|
184 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZjhiMWE4Yjk0ODFkZjlkYjRlMjU1OTJmMjA2Njg1N2M4MzQ0OWE3N2FlYjY4NDgxZThjMmExYWQ5OGNmYmI1NSIsInZlcnNpb24iOjF9.Gmm5lf_qpxjXWWrycDze7LHR-6WGQc62WZTmcoc5uxWd0tivEUqCAFzFdbEU1jVKxQBIyDX77CPuBm7mUA4sCg
|
185 |
+
- type: recall
|
186 |
value: 0.902766476810415
|
187 |
+
name: Recall Weighted
|
188 |
verified: true
|
189 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiY2EzZWYwNjNkYWE1YTcyZGZjNTNhMmNlNzgzYjk5MGJjOWJmZmE5NmYwM2U2NTA5ZDY3ZjFiMmRmZmQwY2QwYiIsInZlcnNpb24iOjF9.yA68rslg3e9kUR3rFTNJJTAad6Usr4uFmJvE_a7G2IvSKqLxG_pqsHszsWfg5mFBQLjWEAyCtdQYMdVayuYMBA
|
190 |
+
- type: f1
|
191 |
value: 0.9023086094638595
|
192 |
+
name: F1 Macro
|
193 |
verified: true
|
194 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMzMyMzZhNjI5MWRmZWJhMjkzN2E0MjM4ZTM5YzZmNTk5YTZmYzU4NDRiYjczZGQ4MDdhNjJiMGU0MjE3NDEwNyIsInZlcnNpb24iOjF9.RCMqH_xUMN97Vos54pTFfAMbLstXUMdFTs-eNaypbDb_Fc-MW8NLmJ6dzJsp9sSvhXyYjugjRMUpMpnQseKXDA
|
195 |
+
- type: f1
|
196 |
value: 0.902766476810415
|
197 |
+
name: F1 Micro
|
198 |
verified: true
|
199 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZTYxZTZhZGM0NThlNTAzNmYwMTA4NDNkN2FiNzhhN2RlYThlYjcxMjE5MjBkMzhiOGYxZGRmMjE0NGM2ZWQ5ZSIsInZlcnNpb24iOjF9.wRfllNw2Gibmi1keU7d_GjkyO0F9HESCgJlJ9PHGZQRRT414nnB-DyRvulHjCNnaNjXqMi0LJimC3iBrNawwAw
|
200 |
+
- type: f1
|
201 |
value: 0.9030161011457231
|
202 |
+
name: F1 Weighted
|
203 |
verified: true
|
204 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNDA0YjAxMWU5MjI4MWEzNTNjMzJlNjM3ZDMxOTE0ZTZhYmZlNmUyNDViNTU2NmMyMmM3MjAxZWVjNWJmZjI4MCIsInZlcnNpb24iOjF9.vJ8aUjfTbFMc1BgNUVpoVDuYwQJYQjwZQxblkUdvSoGtkW_AzQJ_KJ8Njc7IBA3ADgj8iZHjRQNIZkFCf-xICw
|
205 |
+
- type: loss
|
206 |
value: 0.3283354640007019
|
207 |
+
name: loss
|
208 |
verified: true
|
209 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiODdmYzYzNTUzZDNmOWIxM2E0ZmUyOWUzM2Y2NGRmZDNiYjg3ZTMzYTUyNzg3OWEzNzYyN2IyNmExOGRlMWUxYSIsInZlcnNpb24iOjF9.Qv0FzFZPkcBs9aHGf4TEREX4jdkc40NazdMlP2M_-w2wHwyjoAjvhk611RLXHcbicozNelZJLnsOMdEMnPLEDg
|
210 |
- task:
|
211 |
type: natural-language-inference
|
212 |
name: Natural Language Inference
|
|
|
216 |
config: plain_text
|
217 |
split: dev_r1
|
218 |
metrics:
|
219 |
+
- type: accuracy
|
|
|
220 |
value: 0.737
|
221 |
+
name: Accuracy
|
222 |
verified: true
|
223 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMTQ1ZGVkOTVmNTlhYjhkMjVlNTNhMjNmZWFjZWZjZjcxZmRhMDVlOWI0YTdkOTMwYjVjNWFlOGY4OTc1MmRhNiIsInZlcnNpb24iOjF9.wGLgKA1E46ljbLokdPeip_UCr1gqK8iSSbsJKX2vgKuuhDdUWWiECrUFN-bv_78JWKoKW5T0GF_hb-RVDzA0AQ
|
224 |
+
- type: precision
|
225 |
value: 0.737681071614645
|
226 |
+
name: Precision Macro
|
227 |
verified: true
|
228 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYmFkMGUwMjNhN2E3NzMxNTc5NDM0MjY1MGU5ODllM2Q2YzA1MDI3OGI1ZmI4YTcxN2E4ZDk5OWY2OGNiN2I0MCIsInZlcnNpb24iOjF9.6G5qhccjheaNfasgRyrkKBTaQPRzuPMZZ0hrLxTNzAydMDgx09FkFP3hni7WLRMWp0IpwzkEeBlxV-mPyQBtBw
|
229 |
+
- type: precision
|
230 |
value: 0.737
|
231 |
+
name: Precision Micro
|
232 |
verified: true
|
233 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiN2QzYjQ4ZDZjOGU5YzI3YmFlMThlYTRkYTUyYWIyNzc4NDkwNzM1OWFiMTgyMzA0NDZmMGI3YTQxODBjM2EwMCIsInZlcnNpb24iOjF9.bvNWyzfct1CLJFx_EuD2GeKieVtyGJy0cwUBP2qJE1ey2i9SVn6n1Dr0AALTGBkxQ6n5-fJ61QFNufpdr2KvCA
|
234 |
+
- type: precision
|
235 |
value: 0.7376755842752241
|
236 |
+
name: Precision Weighted
|
237 |
verified: true
|
238 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiN2VmYWYzZWQwZmMzMDk0NTdlY2Y3NDkzYWY5ZTdmOGU0ZTUzZWE4YWFhZjVmODhkZmE1Njg4NjA5YjJmYWVhOSIsInZlcnNpb24iOjF9.50FQR2aoBpORLgYa7482ZTrRhT-KfIgv5ltBEHndUBMmqGF9Ru0LHENSGwyD_tO89sGPfiW32TxpbrNWiBdIBA
|
239 |
+
- type: recall
|
240 |
value: 0.7369675064285843
|
241 |
+
name: Recall Macro
|
242 |
verified: true
|
243 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZTM4OTAyNDYwNjY4Zjc5NDljNjBmNTg2Mzk4YjYxM2MyYTA0MDllYTMyNzEwOGI1ZTEwYWE3ZmU0NDZmZDg2NiIsInZlcnNpb24iOjF9.UvWBxuApNV3vd4hpgwqd6XPHCbkA_bB_Cw24ooquiOf0dstvjP3JvpGoDp5SniOzIOg3i2aYbcvFCLJqEXMZCQ
|
244 |
+
- type: recall
|
245 |
value: 0.737
|
246 |
+
name: Recall Micro
|
247 |
verified: true
|
248 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYmQ4MjMzNzRmNTI5NjIzNGQ0ZDFmZTA1MDU3OTk0MzYyMGI0NTMzZTZlMTQ1MDc1MzBkMGMzYjcxZjU1NDNjOSIsInZlcnNpb24iOjF9.kpbdXOpDG3CUB-kUEXsgFT3HWWIbu70wwzs2TNf0rhIuRrzdZz3dXXvwqu1BcLJTsOxl8G6NTiYXgnv-ul8lDg
|
249 |
+
- type: recall
|
250 |
value: 0.737
|
251 |
+
name: Recall Weighted
|
252 |
verified: true
|
253 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNmU1ZWJkNWE0NjczY2NiZWYyNzYyMzllNzZmZTIxNWRkYTEyZDgxN2E0NTNmM2ExMTc1ZWVjMzBiYjg0ZmM1MiIsInZlcnNpb24iOjF9.S6HHWCWnut_LJqXbEA_Z8ZOTtyq6V51ZeiA0qbwzr0hapDYZOZHrN4prvSLvoNv-GiYDYKatwIsAZxCZc5fmCA
|
254 |
+
- type: f1
|
255 |
value: 0.7366853496239583
|
256 |
+
name: F1 Macro
|
257 |
verified: true
|
258 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNzkxYmY2NTcyOTE0ZDdjNGY2ZmE4MzQwMGIxZTA2MDg1NzI5YTQ0MTdkZjdkNzNkMDM2NTk2MTNiNjU4ODMwZCIsInZlcnNpb24iOjF9.ECVaCBqGd0pnQT3xJF7yWrgecIb-5TMiVWpEO0MQGhYy43snkI6Qs-2FOXzvfwIWqG-Q6XIIhGbWZh5TFEGKCA
|
259 |
+
- type: f1
|
260 |
value: 0.737
|
261 |
+
name: F1 Micro
|
262 |
verified: true
|
263 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNDMwMWZiNzQyNWEzNmMzMDJjOTAxYzAxNzc0MTNlYzRkZjllYmNjZmU0OTgzZDFkNWM1ZWI5OTA2NzE5Y2YxOSIsInZlcnNpb24iOjF9.8yZFol_Gcj9n3w9Yk5wx48yql7p3wriDecv-6VSTAB6Q_MWLQAWsCEGRRhgGJ3zvhoRehJZdb35ozk36VOinDQ
|
264 |
+
- type: f1
|
265 |
value: 0.7366990292378379
|
266 |
+
name: F1 Weighted
|
267 |
verified: true
|
268 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMjhhN2ZkMjc5ZGQ3ZGM1Nzk3ZTgwY2E1N2NjYjdhNjZlOTdhYmRlNGVjN2EwNTIzN2UyYTY2ODVlODhmY2Q4ZCIsInZlcnNpb24iOjF9.Cz7ClDAfCGpqdRTYd5v3dPjXFq8lZLXx8AX_rqmF-Jb8KocqVDsHWeZScW5I2oy951UrdMpiUOLieBuJLOmCCQ
|
269 |
+
- type: loss
|
270 |
value: 0.9349392056465149
|
271 |
+
name: loss
|
272 |
verified: true
|
273 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNmI4MTI5MDM1NjBmMzgzMzc2NjM5MzZhOGUyNTgyY2RlZTEyYTIzYzY2ZGJmODcxY2Q5OTVjOWU3OTQ2MzM1NSIsInZlcnNpb24iOjF9.bSOFnYC4Y2y2pW1AR-bgPUHKafR-0OHf8PvexK8eQLsS323Xy9-rYkKUaP09KY6_fk9GqAawv5eqj72B_uyeCA
|
274 |
---
|
275 |
# DeBERTa-v3-base-mnli-fever-anli
|
276 |
## Model description
|