Spaces:
Running
Running
booydar
committed on
Commit
·
429b741
1
Parent(s):
649e5b3
add llama-3.1 + visual improvements
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- app.py +14 -7
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/0.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/1000000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/10000000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/128000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/16000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/32000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/4000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/500000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/64000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/8000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/0.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/1000000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/10000000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/128000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/16000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/32000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/4000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/500000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/64000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/8000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/0.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/1000000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/10000000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/128000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/16000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/32000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/4000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/500000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/64000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/8000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/0.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/1000000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/10000000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/128000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/16000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/32000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/4000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/500000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/64000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/8000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/0.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/1000000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/10000000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/128000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/16000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/32000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/4000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/500000.csv +0 -0
- results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/64000.csv +0 -0
app.py
CHANGED
@@ -50,7 +50,8 @@ def load_model(folders, tab_name, msg_lengths):
|
|
50 |
|
51 |
for i, folder in enumerate(folders):
|
52 |
model_name = folder.split('/')[-1]
|
53 |
-
|
|
|
54 |
results['Model'].append(model_name)
|
55 |
for task in msg_lengths:
|
56 |
if not os.path.isfile(f'{folder}/{tab_name}/{task}.csv'):
|
@@ -60,13 +61,19 @@ def load_model(folders, tab_name, msg_lengths):
|
|
60 |
results[msg_lengths[task]].append(int(df['result'].sum() / len(df) * 100))
|
61 |
|
62 |
mean_score.append(-np.mean([float(results[msg_lengths[task]][i]) for task in list(msg_lengths.keys())[:10]]))
|
63 |
-
for rank, i in enumerate(np.argsort(mean_score)):
|
64 |
-
results['Rank'][i] = rank + 1
|
65 |
|
66 |
-
res_df = pd.DataFrame(results)
|
67 |
-
|
68 |
-
res_df['
|
69 |
-
res_df['
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
70 |
return res_df
|
71 |
|
72 |
def build_leaderboard_tab(folders):
|
|
|
50 |
|
51 |
for i, folder in enumerate(folders):
|
52 |
model_name = folder.split('/')[-1]
|
53 |
+
if 'fine-tune' in model_name:
|
54 |
+
model_name += ' 🛠️'
|
55 |
results['Model'].append(model_name)
|
56 |
for task in msg_lengths:
|
57 |
if not os.path.isfile(f'{folder}/{tab_name}/{task}.csv'):
|
|
|
61 |
results[msg_lengths[task]].append(int(df['result'].sum() / len(df) * 100))
|
62 |
|
63 |
mean_score.append(-np.mean([float(results[msg_lengths[task]][i]) for task in list(msg_lengths.keys())[:10]]))
|
|
|
|
|
64 |
|
65 |
+
res_df = pd.DataFrame(results)
|
66 |
+
lengths = list(msg_lengths.values())
|
67 |
+
res_df['mean_score'] = mean_score
|
68 |
+
res_df['num_lengths'] = -(res_df[lengths].astype(float) > 0).sum(axis=1)
|
69 |
+
res_df = res_df[res_df.num_lengths != 0]
|
70 |
+
res_df.sort_values(['num_lengths', 'mean_score'], inplace=True)
|
71 |
+
res_df['Rank'] = range(1, res_df.shape[0] + 1)
|
72 |
+
|
73 |
+
res_df['Avg ≤32k'] = res_df[lengths[:5]].astype(float).fillna(0).mean(axis=1).astype(int)
|
74 |
+
res_df['Avg ≤128k'] = res_df[lengths[:7]].astype(float).fillna(0).mean(axis=1).astype(int)
|
75 |
+
ordered_columns = ['Rank', 'Model', 'Avg ≤32k', 'Avg ≤128k'] + lengths
|
76 |
+
res_df = res_df[ordered_columns]
|
77 |
return res_df
|
78 |
|
79 |
def build_leaderboard_tab(folders):
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/0.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/1000000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/10000000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/128000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/16000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/32000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/4000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/500000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/64000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/avg/8000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/0.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/1000000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/10000000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/128000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/16000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/32000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/4000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/500000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/64000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa1/8000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/0.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/1000000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/10000000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/128000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/16000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/32000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/4000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/500000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/64000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa2/8000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/0.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/1000000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/10000000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/128000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/16000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/32000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/4000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/500000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/64000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa3/8000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/0.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/1000000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/10000000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/128000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/16000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/32000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/4000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/500000.csv
RENAMED
File without changes
|
results/{~ ARMT (137M) fine-tune → ARMT (137M) fine-tune}/qa4/64000.csv
RENAMED
File without changes
|