MohamedRashad commited on
Commit
85ca42c
·
1 Parent(s): cf880c9

Refactor leaderboard functionality: update model display to clickable links, improve search logic, and remove unused retrieval_results.json

Browse files
Files changed (2) hide show
  1. app.py +26 -12
  2. results/retrieval_results.json +0 -18
app.py CHANGED
@@ -40,25 +40,23 @@ CITATION_BUTTON_TEXT = """
40
  }
41
  """
42
 
43
- df = load_retrieval_results()
44
- df[["Model"]] = df[["Model"]].applymap(lambda x: f'<a href="https://huggingface.co/{x}" target="_blank">{x}</a>')
45
- print(df)
46
 
47
  def search_leaderboard(model_name):
48
- if not model_name:
49
  return df
50
 
51
  threshold = 95 # You can adjust this value to make the search more or less strict
52
 
53
  def calculate_similarity(row):
54
- similarity = fuzz.partial_ratio(model_name.lower(), row['model'].lower())
55
  return similarity if similarity >= threshold else 0
56
 
57
  # Add a new column for similarity scores
58
- df['similarity'] = df.apply(calculate_similarity, axis=1)
59
 
60
  # Filter and sort the dataframe
61
- filtered_df = df[df['similarity'] > 0].sort_values('similarity', ascending=False)
62
 
63
  # Remove the similarity column before returning
64
  filtered_df = filtered_df.drop('similarity', axis=1)
@@ -67,7 +65,12 @@ def search_leaderboard(model_name):
67
 
68
 
69
  def main():
70
- columns_to_show = ["Model", "Model Size", "Embedding Dimension", "Max Tokens", "Web Search Dataset (MRR)", "Web Search Dataset (nDCG@k=None)"]
 
 
 
 
 
71
  with gr.Blocks() as demo:
72
  gr.HTML(HEADER)
73
 
@@ -79,19 +82,30 @@ def main():
79
  search_box_retrieval = gr.Textbox(
80
  placeholder="Search for models...",
81
  label="Search",
82
- interactive=True
 
 
 
 
 
 
83
  )
84
 
85
  retrieval_leaderboard = gr.Dataframe(
86
- df[columns_to_show],
87
  datatype="markdown",
88
  interactive=False
89
  )
90
 
91
  # Submit the search box and the leaderboard
92
- search_box_retrieval.submit(
93
  search_leaderboard,
94
- inputs=search_box_retrieval,
 
 
 
 
 
95
  outputs=retrieval_leaderboard
96
  )
97
 
 
40
  }
41
  """
42
 
43
+ df = None
 
 
44
 
45
  def search_leaderboard(model_name):
46
+ if len(model_name.strip()) == 0:
47
  return df
48
 
49
  threshold = 95 # You can adjust this value to make the search more or less strict
50
 
51
  def calculate_similarity(row):
52
+ similarity = fuzz.partial_ratio(model_name.lower(), row["Model"].lower())
53
  return similarity if similarity >= threshold else 0
54
 
55
  # Add a new column for similarity scores
56
+ df["similarity"] = df.apply(calculate_similarity, axis=1)
57
 
58
  # Filter and sort the dataframe
59
+ filtered_df = df[df["similarity"] > 0].sort_values('similarity', ascending=False)
60
 
61
  # Remove the similarity column before returning
62
  filtered_df = filtered_df.drop('similarity', axis=1)
 
65
 
66
 
67
  def main():
68
+ global df
69
+ df = load_retrieval_results()
70
+ df[["Model"]] = df[["Model"]].applymap(lambda x: f'<a href="https://huggingface.co/{x}" target="_blank">{x}</a>')
71
+ df.drop(columns=["Revision", "Precision", "Task"], inplace=True)
72
+
73
+ columns_to_show = ["Model", "Model Size", "Embedding Dimension", "Max Tokens", "Num Likes", "Web Search Dataset (Overall Score)"]
74
  with gr.Blocks() as demo:
75
  gr.HTML(HEADER)
76
 
 
82
  search_box_retrieval = gr.Textbox(
83
  placeholder="Search for models...",
84
  label="Search",
85
+ scale=5
86
+ )
87
+ columns_to_show_input = gr.CheckboxGroup(
88
+ label="Columns to Show",
89
+ choices=df.columns.tolist(),
90
+ value=columns_to_show,
91
+ scale=4
92
  )
93
 
94
  retrieval_leaderboard = gr.Dataframe(
95
+ value=df[columns_to_show],
96
  datatype="markdown",
97
  interactive=False
98
  )
99
 
100
  # Submit the search box and the leaderboard
101
+ search_box_retrieval.input(
102
  search_leaderboard,
103
+ inputs=[search_box_retrieval],
104
+ outputs=retrieval_leaderboard
105
+ )
106
+ columns_to_show_input.select(
107
+ lambda columns: gr.update(value=df[[col for col in df.columns if col in columns]]),
108
+ inputs=columns_to_show_input,
109
  outputs=retrieval_leaderboard
110
  )
111
 
results/retrieval_results.json DELETED
@@ -1,18 +0,0 @@
1
- [
2
- {
3
- "Model": "intfloat/multilingual-e5-large-instruct",
4
- "Revision": "main",
5
- "Precision": "f16",
6
- "Task": "Retriever",
7
- "Num Downloads": 365122,
8
- "Num Likes": 279,
9
- "License": "mit",
10
- "Model Size": 560,
11
- "Embedding Dimension": 1024,
12
- "Max Tokens": 512,
13
- "Web Search Dataset (MRR)": 0.6526209043734583,
14
- "Web Search Dataset (nDCG@k=None)": 0.7165619055124024,
15
- "Web Search Dataset (Recall@5)": 0.7414125820146662,
16
- "Web Search Dataset (Overall Score)": 0.7035317973001757
17
- }
18
- ]