Commit
·
43b9e03
1
Parent(s):
4490eb8
rename avg->avg(qa1-5) and pin model_name column
Browse files- app.py +6 -3
- draw_utils.py +2 -0
app.py
CHANGED
@@ -10,7 +10,7 @@ st.markdown(PAGE_MARKDOWN, unsafe_allow_html=True)
|
|
10 |
def draw_leaderboard():
|
11 |
df = load_results()
|
12 |
|
13 |
-
tasks = ['avg'] + [f"qa{i}" for i in range(1, 11)]
|
14 |
columns = ["model_name", "≤32k", "≤128k"] + LENGTHS
|
15 |
|
16 |
st.title("🔎📚🪡📚❓ BABILong Leaderboard 🏆")
|
@@ -21,7 +21,7 @@ def draw_leaderboard():
|
|
21 |
'[BABILong evals](https://huggingface.co/datasets/RMT-team/babilong_evals)')
|
22 |
search_term = st.text_input("Search models:", "")
|
23 |
|
24 |
-
tabs = st.tabs(
|
25 |
for i, tab in enumerate(tabs):
|
26 |
with tab:
|
27 |
task_df = df[df.task == tasks[i]][columns]
|
@@ -39,8 +39,11 @@ def draw_leaderboard():
|
|
39 |
|
40 |
st.dataframe(
|
41 |
styled_df,
|
42 |
-
width=
|
43 |
height=height,
|
|
|
|
|
|
|
44 |
)
|
45 |
|
46 |
|
|
|
10 |
def draw_leaderboard():
|
11 |
df = load_results()
|
12 |
|
13 |
+
tasks = ['avg(qa1-5)'] + [f"qa{i}" for i in range(1, 11)]
|
14 |
columns = ["model_name", "≤32k", "≤128k"] + LENGTHS
|
15 |
|
16 |
st.title("🔎📚🪡📚❓ BABILong Leaderboard 🏆")
|
|
|
21 |
'[BABILong evals](https://huggingface.co/datasets/RMT-team/babilong_evals)')
|
22 |
search_term = st.text_input("Search models:", "")
|
23 |
|
24 |
+
tabs = st.tabs(tasks)
|
25 |
for i, tab in enumerate(tabs):
|
26 |
with tab:
|
27 |
task_df = df[df.task == tasks[i]][columns]
|
|
|
39 |
|
40 |
st.dataframe(
|
41 |
styled_df,
|
42 |
+
width=1070,
|
43 |
height=height,
|
44 |
+
column_config={
|
45 |
+
"model_name": st.column_config.Column(width=260, pinned=True)
|
46 |
+
}
|
47 |
)
|
48 |
|
49 |
|
draw_utils.py
CHANGED
@@ -40,6 +40,8 @@ def load_results():
|
|
40 |
res = pd.concat([old_results_filtered, new_results])
|
41 |
res.drop('normalized_name', axis=1, inplace=True)
|
42 |
|
|
|
|
|
43 |
res.replace(-1, np.nan, inplace=True)
|
44 |
res['≤32k'] = res[LENGTHS_32k].mean(axis=1)
|
45 |
res['≤128k'] = res[LENGTHS_128k].mean(axis=1)
|
|
|
40 |
res = pd.concat([old_results_filtered, new_results])
|
41 |
res.drop('normalized_name', axis=1, inplace=True)
|
42 |
|
43 |
+
res['task'] = res['task'].str.replace('avg', 'avg(qa1-5)')
|
44 |
+
|
45 |
res.replace(-1, np.nan, inplace=True)
|
46 |
res['≤32k'] = res[LENGTHS_32k].mean(axis=1)
|
47 |
res['≤128k'] = res[LENGTHS_128k].mean(axis=1)
|