booydar committed on
Commit
429b741
•
1 Parent(s): 649e5b3

add llama-3.1 + visual improvements

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. app.py +14 -7
  2. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/0.csv +0 -0
  3. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/1000000.csv +0 -0
  4. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/10000000.csv +0 -0
  5. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/128000.csv +0 -0
  6. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/16000.csv +0 -0
  7. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/32000.csv +0 -0
  8. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/4000.csv +0 -0
  9. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/500000.csv +0 -0
  10. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/64000.csv +0 -0
  11. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/8000.csv +0 -0
  12. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/0.csv +0 -0
  13. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/1000000.csv +0 -0
  14. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/10000000.csv +0 -0
  15. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/128000.csv +0 -0
  16. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/16000.csv +0 -0
  17. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/32000.csv +0 -0
  18. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/4000.csv +0 -0
  19. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/500000.csv +0 -0
  20. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/64000.csv +0 -0
  21. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/8000.csv +0 -0
  22. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/0.csv +0 -0
  23. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/1000000.csv +0 -0
  24. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/10000000.csv +0 -0
  25. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/128000.csv +0 -0
  26. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/16000.csv +0 -0
  27. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/32000.csv +0 -0
  28. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/4000.csv +0 -0
  29. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/500000.csv +0 -0
  30. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/64000.csv +0 -0
  31. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/8000.csv +0 -0
  32. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/0.csv +0 -0
  33. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/1000000.csv +0 -0
  34. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/10000000.csv +0 -0
  35. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/128000.csv +0 -0
  36. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/16000.csv +0 -0
  37. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/32000.csv +0 -0
  38. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/4000.csv +0 -0
  39. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/500000.csv +0 -0
  40. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/64000.csv +0 -0
  41. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/8000.csv +0 -0
  42. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/0.csv +0 -0
  43. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/1000000.csv +0 -0
  44. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/10000000.csv +0 -0
  45. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/128000.csv +0 -0
  46. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/16000.csv +0 -0
  47. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/32000.csv +0 -0
  48. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/4000.csv +0 -0
  49. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/500000.csv +0 -0
  50. results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/64000.csv +0 -0
app.py CHANGED
@@ -50,7 +50,8 @@ def load_model(folders, tab_name, msg_lengths):
50
 
51
  for i, folder in enumerate(folders):
52
  model_name = folder.split('/')[-1]
53
- results['Rank'].append(i)
 
54
  results['Model'].append(model_name)
55
  for task in msg_lengths:
56
  if not os.path.isfile(f'{folder}/{tab_name}/{task}.csv'):
@@ -60,13 +61,19 @@ def load_model(folders, tab_name, msg_lengths):
60
  results[msg_lengths[task]].append(int(df['result'].sum() / len(df) * 100))
61
 
62
  mean_score.append(-np.mean([float(results[msg_lengths[task]][i]) for task in list(msg_lengths.keys())[:10]]))
63
- for rank, i in enumerate(np.argsort(mean_score)):
64
- results['Rank'][i] = rank + 1
65
 
66
- res_df = pd.DataFrame(results).sort_values(['Rank'])
67
- # print(res_df.head())
68
- res_df['Avg ≤32k'] = res_df[res_df.columns[2:7]].astype(float).fillna(0).mean(axis=1).astype(int)
69
- res_df['Avg ≤128k'] = res_df[res_df.columns[2:9]].astype(float).fillna(0).mean(axis=1).astype(int)
 
 
 
 
 
 
 
 
70
  return res_df
71
 
72
  def build_leaderboard_tab(folders):
 
50
 
51
  for i, folder in enumerate(folders):
52
  model_name = folder.split('/')[-1]
53
+ if 'fine-tune' in model_name:
54
+ model_name += ' 🛠️'
55
  results['Model'].append(model_name)
56
  for task in msg_lengths:
57
  if not os.path.isfile(f'{folder}/{tab_name}/{task}.csv'):
 
61
  results[msg_lengths[task]].append(int(df['result'].sum() / len(df) * 100))
62
 
63
  mean_score.append(-np.mean([float(results[msg_lengths[task]][i]) for task in list(msg_lengths.keys())[:10]]))
 
 
64
 
65
+ res_df = pd.DataFrame(results)
66
+ lengths = list(msg_lengths.values())
67
+ res_df['mean_score'] = mean_score
68
+ res_df['num_lengths'] = -(res_df[lengths].astype(float) > 0).sum(axis=1)
69
+ res_df = res_df[res_df.num_lengths != 0]
70
+ res_df.sort_values(['num_lengths', 'mean_score'], inplace=True)
71
+ res_df['Rank'] = range(1, res_df.shape[0] + 1)
72
+
73
+ res_df['Avg ≤32k'] = res_df[lengths[:5]].astype(float).fillna(0).mean(axis=1).astype(int)
74
+ res_df['Avg ≤128k'] = res_df[lengths[:7]].astype(float).fillna(0).mean(axis=1).astype(int)
75
+ ordered_columns = ['Rank', 'Model', 'Avg ≤32k', 'Avg ≤128k'] + lengths
76
+ res_df = res_df[ordered_columns]
77
  return res_df
78
 
79
  def build_leaderboard_tab(folders):
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/0.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/1000000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/10000000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/128000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/16000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/32000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/4000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/500000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/64000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/8000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/0.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/1000000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/10000000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/128000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/16000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/32000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/4000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/500000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/64000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/8000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/0.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/1000000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/10000000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/128000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/16000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/32000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/4000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/500000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/64000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/8000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/0.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/1000000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/10000000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/128000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/16000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/32000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/4000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/500000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/64000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/8000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/0.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/1000000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/10000000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/128000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/16000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/32000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/4000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/500000.csv RENAMED
File without changes
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/64000.csv RENAMED
File without changes