yurakuratov committed on
Commit
43b9e03
·
1 Parent(s): 4490eb8

rename avg->avg(qa1-5) and pin model_name column

Browse files
Files changed (2) hide show
  1. app.py +6 -3
  2. draw_utils.py +2 -0
app.py CHANGED
@@ -10,7 +10,7 @@ st.markdown(PAGE_MARKDOWN, unsafe_allow_html=True)
10
  def draw_leaderboard():
11
  df = load_results()
12
 
13
- tasks = ['avg'] + [f"qa{i}" for i in range(1, 11)]
14
  columns = ["model_name", "≀32k", "≀128k"] + LENGTHS
15
 
16
  st.title("πŸ”ŽπŸ“šπŸͺ‘πŸ“šβ“ BABILong Leaderboard πŸ†")
@@ -21,7 +21,7 @@ def draw_leaderboard():
21
  '[BABILong evals](https://huggingface.co/datasets/RMT-team/babilong_evals)')
22
  search_term = st.text_input("Search models:", "")
23
 
24
- tabs = st.tabs([str(task) for task in tasks])
25
  for i, tab in enumerate(tabs):
26
  with tab:
27
  task_df = df[df.task == tasks[i]][columns]
@@ -39,8 +39,11 @@ def draw_leaderboard():
39
 
40
  st.dataframe(
41
  styled_df,
42
- width=1100,
43
  height=height,
 
 
 
44
  )
45
 
46
 
 
10
  def draw_leaderboard():
11
  df = load_results()
12
 
13
+ tasks = ['avg(qa1-5)'] + [f"qa{i}" for i in range(1, 11)]
14
  columns = ["model_name", "≀32k", "≀128k"] + LENGTHS
15
 
16
  st.title("πŸ”ŽπŸ“šπŸͺ‘πŸ“šβ“ BABILong Leaderboard πŸ†")
 
21
  '[BABILong evals](https://huggingface.co/datasets/RMT-team/babilong_evals)')
22
  search_term = st.text_input("Search models:", "")
23
 
24
+ tabs = st.tabs(tasks)
25
  for i, tab in enumerate(tabs):
26
  with tab:
27
  task_df = df[df.task == tasks[i]][columns]
 
39
 
40
  st.dataframe(
41
  styled_df,
42
+ width=1070,
43
  height=height,
44
+ column_config={
45
+ "model_name": st.column_config.Column(width=260, pinned=True)
46
+ }
47
  )
48
 
49
 
draw_utils.py CHANGED
@@ -40,6 +40,8 @@ def load_results():
40
  res = pd.concat([old_results_filtered, new_results])
41
  res.drop('normalized_name', axis=1, inplace=True)
42
 
 
 
43
  res.replace(-1, np.nan, inplace=True)
44
  res['≀32k'] = res[LENGTHS_32k].mean(axis=1)
45
  res['≀128k'] = res[LENGTHS_128k].mean(axis=1)
 
40
  res = pd.concat([old_results_filtered, new_results])
41
  res.drop('normalized_name', axis=1, inplace=True)
42
 
43
+ res['task'] = res['task'].str.replace('avg', 'avg(qa1-5)')
44
+
45
  res.replace(-1, np.nan, inplace=True)
46
  res['≀32k'] = res[LENGTHS_32k].mean(axis=1)
47
  res['≀128k'] = res[LENGTHS_128k].mean(axis=1)