陈俊杰 committed on
Commit
7f6ca6e
·
1 Parent(s): 550da67
Files changed (4) hide show
  1. .DS_Store +0 -0
  2. README.md +3 -3
  3. app.py +91 -0
  4. requirements.txt +2 -0
.DS_Store ADDED
Binary file (6.15 kB). View file
 
README.md CHANGED
@@ -1,10 +1,10 @@
1
  ---
2
  title: AEOLLM
3
- emoji: 🏢
4
- colorFrom: red
5
  colorTo: green
6
  sdk: streamlit
7
- sdk_version: 1.35.0
8
  app_file: app.py
9
  pinned: false
10
  ---
 
1
  ---
2
  title: AEOLLM
3
+ emoji: 😻
4
+ colorFrom: green
5
  colorTo: green
6
  sdk: streamlit
7
+ sdk_version: 1.34.0
8
  app_file: app.py
9
  pinned: false
10
  ---
app.py ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
# Streamlit entry point for the AEOLLM leaderboard.
#
# The page shows a title, a short description of the four evaluation tasks,
# and one tab per task containing a score table. The tables currently hold
# placeholder rows ("Model A/B/C"), not real submissions.
#
# NOTE: comments are used instead of docstrings on purpose, so that no bare
# string expression ends up at module level in a Streamlit script.

import streamlit as st
import pandas as pd

# Page-wide CSS. `unsafe_allow_html=True` is required here because the
# payload is a raw <style> element that st.markdown would otherwise escape.
st.markdown("""
<style>
h1 {
font-size: 2.5em; /* 标题字体大小 */
}
.stDataFrame {
font-family: Helvetica;
}
.dataframe th, .dataframe td {
width: auto;
min-width: 500px;
}
</style>
""", unsafe_allow_html=True)

# Page title.
st.title('🏆AEOLLM Leaderboard')

# Description. This text is plain Markdown (no HTML), so it is rendered
# without `unsafe_allow_html`. The project name is spelled "AEOLLM".
st.markdown("""
This leaderboard is used to show the performance of the **automatic evaluation methods of LLMs** submitted by the **AEOLLM team** on four tasks:
- Summary Generation (SG)
- Non-Factoid QA (NFQA)
- Dialogue Generation (DG)
- Text Expansion (TE).

Details of AEOLLM can be found at the link: [https://cjj826.github.io/AEOLLM/](https://cjj826.github.io/AEOLLM/)
""")


# Build a fresh copy of the placeholder score table used by every task.
# A new dict (with new lists) is returned on each call so the per-task
# tables never share mutable state.
def _example_scores():
    return {
        "methods": ["Model A", "Model B", "Model C"],
        "team": ["U1", "U2", "U3"],
        "acc": [0.75, 0.64, 0.83],
        "tau": [0.05, 0.28, 0.16],
        "s": [0.12, 0.27, 0.18],
    }


# Example data, one table per task. The module-level names are kept so any
# code that refers to them keeps working.
SG = _example_scores()
df1 = pd.DataFrame(SG)

NFQA = _example_scores()
df2 = pd.DataFrame(NFQA)

DG = _example_scores()
df3 = pd.DataFrame(DG)

TE = _example_scores()
df4 = pd.DataFrame(TE)

# Create one tab per task, labelled with the task abbreviation.
tab1, tab2, tab3, tab4 = st.tabs(["SG", "NFQA", "DG", "TE"])

# Fill each tab with its full task name as a header and its score table.
_TAB_CONTENTS = (
    (tab1, "Summary Generation", df1),
    (tab2, "Non-Factoid QA", df2),
    (tab3, "Dialogue Generation", df3),
    (tab4, "Text Expansion", df4),
)
for _tab, _heading, _scores in _TAB_CONTENTS:
    with _tab:
        st.header(_heading)
        st.dataframe(_scores, use_container_width=True)
requirements.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ pandas==2.2.2
2
+ streamlit==1.34.0