File size: 1,516 Bytes
73a9525
 
 
1edab07
 
 
 
 
 
38d9f8d
1edab07
 
 
73a9525
1edab07
 
ed56ab7
1edab07
 
 
ed56ab7
1edab07
 
ed56ab7
1edab07
 
 
ed56ab7
1edab07
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
import streamlit as st
import pandas as pd

# CSS styles: rules for the page body, dataframes, headers, and buttons.
_PAGE_CSS = """
<style>
body {
    color: #fff;
    background-color: #333;
}
.stDataFrame {
    font-family: Arial;
    font-size: 16px;
}
.stHeader {
    color: #ff6347;
}
div.stButton > button:first-child {
    background-color: #ff6347;
    color: #fff;
}
</style>
"""

# Title and description shown at the top of the page.
_PAGE_TITLE = "AEOLLM leaderboard"
_PAGE_DESCRIPTION = (
    "This leaderboard is used to show the performance of the automation "
    "evaluation methods of LLMs submitted by the AEOLLM team on four tasks: "
    "Summary Generation (SG), Non-Factoid QA (NFQA), Dialogue Generation (DG), "
    "Text Expansion (TE)."
)

# The stylesheet is raw HTML, so it is passed with unsafe_allow_html=True.
st.markdown(_PAGE_CSS, unsafe_allow_html=True)

st.title(_PAGE_TITLE)
st.write(_PAGE_DESCRIPTION)

# Create sample data
def create_data():
    """Return placeholder leaderboard data as a column-name -> values mapping.

    The mapping has five columns ("methods", "team", "acc", "tau", "s"), each
    holding a list of three entries (one per sample method). A new dict with
    new lists is built on every call.
    """
    column_names = ("methods", "team", "acc", "tau", "s")
    # One tuple per sample entry, in the same order as column_names.
    sample_rows = (
        ("Model A", "U1", 0.75, 0.05, 0.12),
        ("Model B", "U2", 0.64, 0.28, 0.27),
        ("Model C", "U3", 0.83, 0.16, 0.18),
    )
    # Transpose the rows into per-column lists.
    return {
        name: list(values)
        for name, values in zip(column_names, zip(*sample_rows))
    }

# One table per task; each is built from its own create_data() call.
df1, df2, df3, df4 = (pd.DataFrame(create_data()) for _ in range(4))

# Lay the page out in two columns, each holding a pair of task tabs.
left_col, right_col = st.columns(2)
task_layout = (
    (
        left_col,
        (
            ("SG", "Summary Generation", df1),
            ("NFQA", "Non-Factoid QA", df2),
        ),
    ),
    (
        right_col,
        (
            ("DG", "Dialogue Generation", df3),
            ("TE", "Text Expansion", df4),
        ),
    ),
)

for column, tasks in task_layout:
    with column:
        # Tab labels are the short task names; each tab shows a header and its table.
        tab_handles = st.tabs([short_name for short_name, _, _ in tasks])
        for tab_handle, (_, heading, frame) in zip(tab_handles, tasks):
            with tab_handle:
                st.header(heading)
                st.dataframe(frame)