黄济民 commited on
Commit
129288f
1 Parent(s): eb2320a

Add application files

Browse files
Files changed (2) hide show
  1. app.py +21 -0
  2. leaderboard.csv +9 -14
app.py CHANGED
@@ -9,6 +9,25 @@ leaderboard_df = pd.read_csv('leaderboard.csv').transpose()
9
  TITLE = "Leaderboard"
10
  INTRODUCTION_TEXT = "This is the leaderboard."
11
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  def launch_gradio():
13
  demo = gr.Blocks()
14
 
@@ -19,6 +38,8 @@ def launch_gradio():
19
  # Create a gradio table from pandas dataframe
20
  leaderboard_table = gr.components.Dataframe(
21
  value=leaderboard_df,
 
 
22
  max_rows=5,
23
  elem_id="leaderboard-table",
24
  )
 
9
  TITLE = "Leaderboard"
10
  INTRODUCTION_TEXT = "This is the leaderboard."
11
 
12
+ COLS = [
13
+ ("Model", "str"),
14
+ ("FPB-acc", "number"),
15
+ ("FPB-F1", "number"),
16
+ ("FiQA-SA-F1", "number"),
17
+ ("Headline-AvgF1", "number"),
18
+ ("NER-EntityF1", "number"),
19
+ ("FinQA-EmAcc", "number"),
20
+ ("ConvFinQA-EmAcc", "number"),
21
+ ("BigData22-Acc", "number"),
22
+ ("BigData22-MCC", "number"),
23
+ ("ACL18-Acc", "number"),
24
+ ("ACL18-MCC", "number"),
25
+ ("CIKM18-Acc", "number"),
26
+ ("CIKM18-MCC", "number")
27
+ ]
28
+
29
+ TYPES = [col_type for _, col_type in COLS]
30
+
31
  def launch_gradio():
32
  demo = gr.Blocks()
33
 
 
38
  # Create a gradio table from pandas dataframe
39
  leaderboard_table = gr.components.Dataframe(
40
  value=leaderboard_df,
41
+ headers=[col_name for col_name, _ in COLS],
42
+ datatype=TYPES,
43
  max_rows=5,
44
  elem_id="leaderboard-table",
45
  )
leaderboard.csv CHANGED
@@ -1,14 +1,9 @@
1
- Dataset,Metrics,GPT NeoX,OPT 66B,BLOOM,Chat GPT,GPT 4,Bloomberg GPT,FinMA 7B,FinMA 30B,FinMA 7B-full
2
- FPB,Acc,-,-,-,0.78,0.76,-,0.86,0.87,0.87
3
- FPB,F1,0.45,0.49,0.50,0.78,0.78,0.51,0.86,0.88,0.87
4
- FiQA-SA,F1,0.51,0.52,0.53,-,-,0.75,0.84,0.87,0.79
5
- Headline,AvgF1,0.73,0.79,0.77,0.77,0.86,0.82,0.98,0.97,0.97
6
- NER,EntityF1,0.61,0.57,0.56,0.77,0.83,0.61,0.75,0.62,0.69
7
- FinQA,EmAcc,-,-,-,0.58,0.63,-,0.06,0.11,0.04
8
- ConvFinQA,EmAcc,0.28,0.30,0.36,0.60,0.76,0.43,0.25,0.40,0.20
9
- BigData22,Acc,-,-,-,0.53,0.54,-,0.48,0.47,0.49
10
- BigData22,MCC,-,-,-,-0.025,0.03,-,0.04,0.04,0.01
11
- ACL18,Acc,-,-,-,0.50,0.52,-,0.50,0.49,0.56
12
- ACL18,MCC,-,-,-,0.005,0.02,-,0.00,0.00,0.10
13
- CIKM18,Acc,-,-,-,0.55,0.57,-,0.56,0.43,0.53
14
- CIKM18,MCC,-,-,-,0.01,0.02,-,-0.02,-0.05,-0.03
 
1
+ GPT NeoX,NaN,0.45,0.51,0.73,0.61,NaN,0.28,NaN,NaN,NaN,NaN,NaN,NaN
2
+ OPT 66B,NaN,0.49,0.52,0.79,0.57,NaN,0.30,NaN,NaN,NaN,NaN,NaN,NaN
3
+ BLOOM,NaN,0.50,0.53,0.77,0.56,NaN,0.36,NaN,NaN,NaN,NaN,NaN,NaN
4
+ Chat GPT,0.78,0.78,NaN,0.77,0.77,0.58,0.60,0.53,NaN,NaN,0.50,0.55,NaN
5
+ GPT 4,0.76,0.78,NaN,0.86,0.83,0.63,0.76,0.54,0.03,0.52,0.02,0.57,0.01
6
+ Bloomberg GPT,NaN,0.51,0.75,0.82,0.61,NaN,0.43,NaN,0.04,NaN,0.00,NaN,NaN
7
+ FinMA 7B,0.86,0.86,0.84,0.98,0.75,NaN,0.25,NaN,NaN,NaN,NaN,NaN,NaN
8
+ FinMA 30B,0.87,0.88,0.87,0.97,0.62,0.06,0.40,0.48,0.04,0.50,0.00,0.56,NaN
9
+ FinMA 7B-full,0.87,0.87,0.79,0.97,0.69,0.11,0.20,0.47,0.01,0.49,0.10,-0.03