Jimin Huang committed on
Commit
c248d53
1 Parent(s): 96234cc

feature: add auto evaluation tab

Browse files
Files changed (1) hide show
  1. leaderboard_auto.csv +1 -1
leaderboard_auto.csv CHANGED
@@ -1,7 +1,7 @@
1
  llama-7b,0.02,0.08,0.95,0.31,0.02,0.76,0.05,0,0,0,1,0.02,0,0.96,0.08,0,0.84,0.01,0.02,0.99,0,0,0,0,1,0,0,1
2
  bloomz-7b,0.36,0.52,0.03,0.79,0.0,0.61,0.0,0.01,0.54,0.01,0.02,0.48,-0.02,0.06,0.51,-0.03,0.10,0.18,0.31,0.49,0,0,0,0,1,0.57,0.72,0
3
  ChatGpt,0.78,0.78,0.0,,,0.77,0.77,0.58,0.53,-0.025,0,0.5,0.005,0,0.55,0.01,0,,,,,,,,,,,
4
- GPT-4,0.76,0.78,0.0,,,0.86,0.83,0.63,0.54,0.03,0,0.52,0.02,0,0.57,0.01,0,,,,,,,,,,,
5
  FinMA-7B,0.86,0.86,0.0,0.84,0.0,0.98,0.75,0.06,0.48,0.04,0.0,0.5,0.0,0,0.56,-0.02,0.0,0.45,0.58,0.24,0,0,0,0,1,0,0,1
6
  FinMA-7B-full,0.88,0.88,0.0,0.83,0,0.97,0.67,0.06,0.51,0.06,0.0,0.52,0.03,0.0,0.52,0.04,0.0,0.47,0.61,0.24,0,0,0,0,1,0,0,1
7
  Baichuan-7B,0.01,0.02,0.99,0.55,0.03,0.76,0.16,0,0.34,0,0.38,0.32,0,0.38,0.15,0,0.73,0.01,0.06,0.98,0,0,0,0,1,0,0,1
 
1
  llama-7b,0.02,0.08,0.95,0.31,0.02,0.76,0.05,0,0,0,1,0.02,0,0.96,0.08,0,0.84,0.01,0.02,0.99,0,0,0,0,1,0,0,1
2
  bloomz-7b,0.36,0.52,0.03,0.79,0.0,0.61,0.0,0.01,0.54,0.01,0.02,0.48,-0.02,0.06,0.51,-0.03,0.10,0.18,0.31,0.49,0,0,0,0,1,0.57,0.72,0
3
  ChatGpt,0.78,0.78,0.0,,,0.77,0.77,0.58,0.53,-0.025,0,0.5,0.005,0,0.55,0.01,0,,,,,,,,,,,
4
+ GPT-4,0.76,0.78,0.0,,,0.86,0.83,0.63,0.54,0.03,0,0.52,0.02,0,0.57,0.01,0,0.69,0.71,0,,,0.56,0.57,0,0.75,0.75,0
5
  FinMA-7B,0.86,0.86,0.0,0.84,0.0,0.98,0.75,0.06,0.48,0.04,0.0,0.5,0.0,0,0.56,-0.02,0.0,0.45,0.58,0.24,0,0,0,0,1,0,0,1
6
  FinMA-7B-full,0.88,0.88,0.0,0.83,0,0.97,0.67,0.06,0.51,0.06,0.0,0.52,0.03,0.0,0.52,0.04,0.0,0.47,0.61,0.24,0,0,0,0,1,0,0,1
7
  Baichuan-7B,0.01,0.02,0.99,0.55,0.03,0.76,0.16,0,0.34,0,0.38,0.32,0,0.38,0.15,0,0.73,0.01,0.06,0.98,0,0,0,0,1,0,0,1