陈俊杰
committed on
Commit
•
f51ed55
1
Parent(s):
5cd297d
cjj:gpt-4o
Browse files
app.py
CHANGED
@@ -245,7 +245,7 @@ elif page == "LeaderBoard":
|
|
245 |
""", unsafe_allow_html=True)
|
246 |
df = {
|
247 |
"TeamId": ["baseline", "baseline", "baseline", "baseline"],
|
248 |
-
"Methods": ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o
|
249 |
"Average (all 4 datatsets)": [],
|
250 |
"Average (Dialogue Generation)": [],
|
251 |
"Accuracy (Dialogue Generation)": [],
|
@@ -268,7 +268,7 @@ elif page == "LeaderBoard":
|
|
268 |
# teamId 唯一标识码
|
269 |
DG = {
|
270 |
"TeamId": ["baseline1", "baseline2", "baseline3", "baseline4"],
|
271 |
-
"Methods": ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o
|
272 |
"Accuracy": [0.5806, 0.5483, 0.6001, 0.6472],
|
273 |
"Kendall's Tau": [0.3243, 0.1739, 0.3042, 0.4167],
|
274 |
"Spearman": [0.3505, 0.1857, 0.3264, 0.4512]
|
@@ -277,7 +277,7 @@ elif page == "LeaderBoard":
|
|
277 |
|
278 |
TE = {
|
279 |
"TeamId": ["baseline1", "baseline2", "baseline3", "baseline4"],
|
280 |
-
"Methods": ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o
|
281 |
"Accuracy": [0.5107, 0.5050, 0.5461, 0.5581],
|
282 |
"Kendall's Tau": [0.1281, 0.0635, 0.2716, 0.3864],
|
283 |
"Spearman": [0.1352, 0.0667, 0.2867, 0.4157]
|
@@ -286,7 +286,7 @@ elif page == "LeaderBoard":
|
|
286 |
|
287 |
SG = {
|
288 |
"TeamId": ["baseline1", "baseline2", "baseline3", "baseline4"],
|
289 |
-
"Methods": ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o
|
290 |
"Accuracy": [0.6504, 0.6014, 0.7162, 0.7441],
|
291 |
"Kendall's Tau": [0.3957, 0.2688, 0.5092, 0.5001],
|
292 |
"Spearman": [0.4188, 0.2817, 0.5403, 0.5405],
|
@@ -295,7 +295,7 @@ elif page == "LeaderBoard":
|
|
295 |
|
296 |
NFQA = {
|
297 |
"TeamId": ["baseline1", "baseline2", "baseline3", "baseline4"],
|
298 |
-
"Methods": ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o
|
299 |
"Accuracy": [0.5935, 0.5817, 0.7000, 0.7203],
|
300 |
"Kendall's Tau": [0.2332, 0.2389, 0.4440, 0.4235],
|
301 |
"Spearman": [0.2443, 0.2492, 0.4630, 0.4511]
|
|
|
245 |
""", unsafe_allow_html=True)
|
246 |
df = {
|
247 |
"TeamId": ["baseline", "baseline", "baseline", "baseline"],
|
248 |
+
"Methods": ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o"],
|
249 |
"Average (all 4 datatsets)": [],
|
250 |
"Average (Dialogue Generation)": [],
|
251 |
"Accuracy (Dialogue Generation)": [],
|
|
|
268 |
# teamId 唯一标识码
|
269 |
DG = {
|
270 |
"TeamId": ["baseline1", "baseline2", "baseline3", "baseline4"],
|
271 |
+
"Methods": ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o"],
|
272 |
"Accuracy": [0.5806, 0.5483, 0.6001, 0.6472],
|
273 |
"Kendall's Tau": [0.3243, 0.1739, 0.3042, 0.4167],
|
274 |
"Spearman": [0.3505, 0.1857, 0.3264, 0.4512]
|
|
|
277 |
|
278 |
TE = {
|
279 |
"TeamId": ["baseline1", "baseline2", "baseline3", "baseline4"],
|
280 |
+
"Methods": ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o"],
|
281 |
"Accuracy": [0.5107, 0.5050, 0.5461, 0.5581],
|
282 |
"Kendall's Tau": [0.1281, 0.0635, 0.2716, 0.3864],
|
283 |
"Spearman": [0.1352, 0.0667, 0.2867, 0.4157]
|
|
|
286 |
|
287 |
SG = {
|
288 |
"TeamId": ["baseline1", "baseline2", "baseline3", "baseline4"],
|
289 |
+
"Methods": ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o"],
|
290 |
"Accuracy": [0.6504, 0.6014, 0.7162, 0.7441],
|
291 |
"Kendall's Tau": [0.3957, 0.2688, 0.5092, 0.5001],
|
292 |
"Spearman": [0.4188, 0.2817, 0.5403, 0.5405],
|
|
|
295 |
|
296 |
NFQA = {
|
297 |
"TeamId": ["baseline1", "baseline2", "baseline3", "baseline4"],
|
298 |
+
"Methods": ["chatglm3-6b", "baichuan2-13b", "chatglm-pro", "gpt-4o"],
|
299 |
"Accuracy": [0.5935, 0.5817, 0.7000, 0.7203],
|
300 |
"Kendall's Tau": [0.2332, 0.2389, 0.4440, 0.4235],
|
301 |
"Spearman": [0.2443, 0.2492, 0.4630, 0.4511]
|