Spaces:
Running
Running
黄济民
committed on
Commit
•
bd8528a
1
Parent(s):
2c6c950
feature: add auto evaluation tab
Browse files
- app.py +0 -1
- leaderboard_auto.csv +2 -0
app.py
CHANGED
@@ -36,7 +36,6 @@ COLS_AUTO = [
|
|
36 |
("FiQA-SA-F1", "number"),
|
37 |
("FiQA-SA-missing", "number"),
|
38 |
("Headline-AvgF1", "number"),
|
39 |
-
("Headline-missing", "number"),
|
40 |
("NER-EntityF1", "number"),
|
41 |
("FinQA-EmAcc", "number"),
|
42 |
("BigData22-Acc", "number"),
|
|
|
36 |
("FiQA-SA-F1", "number"),
|
37 |
("FiQA-SA-missing", "number"),
|
38 |
("Headline-AvgF1", "number"),
|
|
|
39 |
("NER-EntityF1", "number"),
|
40 |
("FinQA-EmAcc", "number"),
|
41 |
("BigData22-Acc", "number"),
|
leaderboard_auto.csv
CHANGED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
llama-7b,0.02,0.08,0.95,0.31,0.02,0.76,0.05,0,0,0,1,0,0,1,0,0,1,0.01,0.02,0.99,0,0,0,0,1,0,0,1
|
2 |
+
bloomz-7b,0.36,0.52,0.03,0.79,0.0,0.61,0.0,0.01,0,0,1,0,0,1,0,0,1,0.18,0.31,0.49,0,0,0,0,1,0.57,0.72,0
|