Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -3,7 +3,6 @@ import ast
|
|
3 |
import argparse
|
4 |
import glob
|
5 |
import pickle
|
6 |
-
|
7 |
import gradio as gr
|
8 |
import numpy as np
|
9 |
import pandas as pd
|
@@ -11,8 +10,6 @@ import os
|
|
11 |
from collections import defaultdict
|
12 |
from matplotlib.colors import LinearSegmentedColormap
|
13 |
|
14 |
-
|
15 |
-
|
16 |
def make_default_md():
|
17 |
leaderboard_md = f"""
|
18 |
# πππͺ‘πβ BABIlong Leaderboard π
|
@@ -23,12 +20,10 @@ def make_default_md():
|
|
23 |
"""
|
24 |
return leaderboard_md
|
25 |
|
26 |
-
|
27 |
def make_arena_leaderboard_md(total_models):
|
28 |
-
leaderboard_md = f"""Total #models: **{total_models}**. Last updated:
|
29 |
return leaderboard_md
|
30 |
|
31 |
-
|
32 |
def make_model_desc_md(f_len):
|
33 |
desc_md = make_arena_leaderboard_md(f_len)
|
34 |
models = next(os.walk('info'))[2]
|
@@ -36,15 +31,12 @@ def make_model_desc_md(f_len):
|
|
36 |
model_name = model.split('.md')[0]
|
37 |
with open(os.path.join('info', model), 'r') as f:
|
38 |
description = f.read()
|
39 |
-
|
40 |
desc_md += f"\n\n### {model_name}\n{description}"
|
41 |
return desc_md
|
42 |
|
43 |
-
|
44 |
def model_hyperlink(model_name, link):
|
45 |
return f'<a target="_blank" href="{link}" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">{model_name}</a>'
|
46 |
|
47 |
-
|
48 |
def load_model(folders, tab_name, msg_lengths):
|
49 |
results = defaultdict(list)
|
50 |
|
@@ -53,7 +45,7 @@ def load_model(folders, tab_name, msg_lengths):
|
|
53 |
return '-'
|
54 |
def __float__(self):
|
55 |
return 0.0
|
56 |
-
|
57 |
mean_score = []
|
58 |
|
59 |
for i, folder in enumerate(folders):
|
@@ -71,11 +63,8 @@ def load_model(folders, tab_name, msg_lengths):
|
|
71 |
for rank, i in enumerate(np.argsort(mean_score)):
|
72 |
results['Rank'][i] = rank + 1
|
73 |
|
74 |
-
|
75 |
return pd.DataFrame(results).sort_values(['Rank'])
|
76 |
|
77 |
-
|
78 |
-
|
79 |
def build_leaderboard_tab(folders):
|
80 |
default_md = make_default_md()
|
81 |
md_1 = gr.Markdown(default_md, elem_id="leaderboard_markdown")
|
@@ -93,7 +82,7 @@ def build_leaderboard_tab(folders):
|
|
93 |
}
|
94 |
|
95 |
with gr.Tabs() as tabs:
|
96 |
-
for tab_id, tab_name in enumerate(['qa1','qa2', 'qa3', 'qa4', '
|
97 |
df = load_model(folders, tab_name, msg_lengths)
|
98 |
cmap = LinearSegmentedColormap.from_list('ryg', ["red", "yellow", "green"], N=256)
|
99 |
|
@@ -125,7 +114,7 @@ def build_leaderboard_tab(folders):
|
|
125 |
wrap=True,
|
126 |
)
|
127 |
|
128 |
-
with gr.Tab("
|
129 |
desc_md = make_model_desc_md(len(folders))
|
130 |
gr.Markdown(desc_md, elem_id="leaderboard_markdown")
|
131 |
|
@@ -169,8 +158,6 @@ footer {
|
|
169 |
}
|
170 |
"""
|
171 |
|
172 |
-
|
173 |
-
|
174 |
def build_demo(folders):
|
175 |
text_size = gr.themes.sizes.text_lg
|
176 |
|
|
|
3 |
import argparse
|
4 |
import glob
|
5 |
import pickle
|
|
|
6 |
import gradio as gr
|
7 |
import numpy as np
|
8 |
import pandas as pd
|
|
|
10 |
from collections import defaultdict
|
11 |
from matplotlib.colors import LinearSegmentedColormap
|
12 |
|
|
|
|
|
13 |
def make_default_md():
|
14 |
leaderboard_md = f"""
|
15 |
# πππͺ‘πβ BABIlong Leaderboard π
|
|
|
20 |
"""
|
21 |
return leaderboard_md
|
22 |
|
|
|
23 |
def make_arena_leaderboard_md(total_models):
|
24 |
+
leaderboard_md = f"""Total #models: **{total_models}**. Last updated: May 09, 2024."""
|
25 |
return leaderboard_md
|
26 |
|
|
|
27 |
def make_model_desc_md(f_len):
|
28 |
desc_md = make_arena_leaderboard_md(f_len)
|
29 |
models = next(os.walk('info'))[2]
|
|
|
31 |
model_name = model.split('.md')[0]
|
32 |
with open(os.path.join('info', model), 'r') as f:
|
33 |
description = f.read()
|
|
|
34 |
desc_md += f"\n\n### {model_name}\n{description}"
|
35 |
return desc_md
|
36 |
|
|
|
37 |
def model_hyperlink(model_name, link):
|
38 |
return f'<a target="_blank" href="{link}" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">{model_name}</a>'
|
39 |
|
|
|
40 |
def load_model(folders, tab_name, msg_lengths):
|
41 |
results = defaultdict(list)
|
42 |
|
|
|
45 |
return '-'
|
46 |
def __float__(self):
|
47 |
return 0.0
|
48 |
+
|
49 |
mean_score = []
|
50 |
|
51 |
for i, folder in enumerate(folders):
|
|
|
63 |
for rank, i in enumerate(np.argsort(mean_score)):
|
64 |
results['Rank'][i] = rank + 1
|
65 |
|
|
|
66 |
return pd.DataFrame(results).sort_values(['Rank'])
|
67 |
|
|
|
|
|
68 |
def build_leaderboard_tab(folders):
|
69 |
default_md = make_default_md()
|
70 |
md_1 = gr.Markdown(default_md, elem_id="leaderboard_markdown")
|
|
|
82 |
}
|
83 |
|
84 |
with gr.Tabs() as tabs:
|
85 |
+
for tab_id, tab_name in enumerate(['qa1','qa2', 'qa3', 'qa4', 'qa5']):
|
86 |
df = load_model(folders, tab_name, msg_lengths)
|
87 |
cmap = LinearSegmentedColormap.from_list('ryg', ["red", "yellow", "green"], N=256)
|
88 |
|
|
|
114 |
wrap=True,
|
115 |
)
|
116 |
|
117 |
+
with gr.Tab("Description", id=tab_id + 1):
|
118 |
desc_md = make_model_desc_md(len(folders))
|
119 |
gr.Markdown(desc_md, elem_id="leaderboard_markdown")
|
120 |
|
|
|
158 |
}
|
159 |
"""
|
160 |
|
|
|
|
|
161 |
def build_demo(folders):
|
162 |
text_size = gr.themes.sizes.text_lg
|
163 |
|