Spaces:
Running
Running
Jimin Huang
commited on
Commit
•
c248d53
1
Parent(s):
96234cc
feature: add auto evaluation tab
Browse files- leaderboard_auto.csv +1 -1
leaderboard_auto.csv
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
llama-7b,0.02,0.08,0.95,0.31,0.02,0.76,0.05,0,0,0,1,0.02,0,0.96,0.08,0,0.84,0.01,0.02,0.99,0,0,0,0,1,0,0,1
|
2 |
bloomz-7b,0.36,0.52,0.03,0.79,0.0,0.61,0.0,0.01,0.54,0.01,0.02,0.48,-0.02,0.06,0.51,-0.03,0.10,0.18,0.31,0.49,0,0,0,0,1,0.57,0.72,0
|
3 |
ChatGpt,0.78,0.78,0.0,,,0.77,0.77,0.58,0.53,-0.025,0,0.5,0.005,0,0.55,0.01,0,,,,,,,,,,,
|
4 |
-
GPT-4,0.76,0.78,0.0,,,0.86,0.83,0.63,0.54,0.03,0,0.52,0.02,0,0.57,0.01,0
|
5 |
FinMA-7B,0.86,0.86,0.0,0.84,0.0,0.98,0.75,0.06,0.48,0.04,0.0,0.5,0.0,0,0.56,-0.02,0.0,0.45,0.58,0.24,0,0,0,0,1,0,0,1
|
6 |
FinMA-7B-full,0.88,0.88,0.0,0.83,0,0.97,0.67,0.06,0.51,0.06,0.0,0.52,0.03,0.0,0.52,0.04,0.0,0.47,0.61,0.24,0,0,0,0,1,0,0,1
|
7 |
Baichuan-7B,0.01,0.02,0.99,0.55,0.03,0.76,0.16,0,0.34,0,0.38,0.32,0,0.38,0.15,0,0.73,0.01,0.06,0.98,0,0,0,0,1,0,0,1
|
|
|
1 |
llama-7b,0.02,0.08,0.95,0.31,0.02,0.76,0.05,0,0,0,1,0.02,0,0.96,0.08,0,0.84,0.01,0.02,0.99,0,0,0,0,1,0,0,1
|
2 |
bloomz-7b,0.36,0.52,0.03,0.79,0.0,0.61,0.0,0.01,0.54,0.01,0.02,0.48,-0.02,0.06,0.51,-0.03,0.10,0.18,0.31,0.49,0,0,0,0,1,0.57,0.72,0
|
3 |
ChatGpt,0.78,0.78,0.0,,,0.77,0.77,0.58,0.53,-0.025,0,0.5,0.005,0,0.55,0.01,0,,,,,,,,,,,
|
4 |
+
GPT-4,0.76,0.78,0.0,,,0.86,0.83,0.63,0.54,0.03,0,0.52,0.02,0,0.57,0.01,0,0.69,0.71,0,,,0.56,0.57,0,0.75,0.75,0
|
5 |
FinMA-7B,0.86,0.86,0.0,0.84,0.0,0.98,0.75,0.06,0.48,0.04,0.0,0.5,0.0,0,0.56,-0.02,0.0,0.45,0.58,0.24,0,0,0,0,1,0,0,1
|
6 |
FinMA-7B-full,0.88,0.88,0.0,0.83,0,0.97,0.67,0.06,0.51,0.06,0.0,0.52,0.03,0.0,0.52,0.04,0.0,0.47,0.61,0.24,0,0,0,0,1,0,0,1
|
7 |
Baichuan-7B,0.01,0.02,0.99,0.55,0.03,0.76,0.16,0,0.34,0,0.38,0.32,0,0.38,0.15,0,0.73,0.01,0.06,0.98,0,0,0,0,1,0,0,1
|