Spaces:
Running
Running
Alvaro Romo
committed on
Commit
·
b7f9bcb
1
Parent(s):
c2f297a
Added filter data
Browse files
app.py
CHANGED
@@ -19,6 +19,19 @@ HF_TOKEN = os.environ.get("HF_TOKEN", None)
|
|
19 |
request_file = Path("user_request/") / f"data_{uuid.uuid4()}.json"
|
20 |
request_folder = request_file.parent
|
21 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
22 |
scheduler = CommitScheduler(
|
23 |
repo_id="iberbench/ivace-user-request",
|
24 |
repo_type="dataset",
|
@@ -52,17 +65,6 @@ def get_url(html_content: str) -> str:
|
|
52 |
@st.cache_data
|
53 |
def load_data() -> pd.DataFrame:
|
54 |
try:
|
55 |
-
columns = [
|
56 |
-
"eval_name",
|
57 |
-
"Model",
|
58 |
-
"Type",
|
59 |
-
"Average ⬆️",
|
60 |
-
"IFEval",
|
61 |
-
"MMLU-PRO",
|
62 |
-
"GPQA",
|
63 |
-
"MUSR",
|
64 |
-
"CO₂ cost (kg)",
|
65 |
-
]
|
66 |
data = (
|
67 |
load_dataset("open-llm-leaderboard/contents")["train"]
|
68 |
.to_pandas()
|
@@ -72,14 +74,39 @@ def load_data() -> pd.DataFrame:
|
|
72 |
data["Model"] = data["Model"].apply(get_url)
|
73 |
data.sort_values(by="Average ⬆️", ascending=False, inplace=True)
|
74 |
data.reset_index(drop=True, inplace=True)
|
|
|
|
|
|
|
75 |
return data
|
76 |
except FileNotFoundError:
|
77 |
st.error("open-llm-leaderboard/contents was not found in the hub")
|
78 |
return pd.DataFrame()
|
79 |
|
80 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
81 |
# streamlit UI
|
82 |
leaderboard_data = load_data()
|
|
|
|
|
|
|
83 |
tabs = st.tabs(["Leaderboard", "Submit model"])
|
84 |
|
85 |
with tabs[0]:
|
@@ -101,13 +128,20 @@ with tabs[0]:
|
|
101 |
""",
|
102 |
unsafe_allow_html=True,
|
103 |
)
|
104 |
-
|
105 |
-
|
106 |
-
|
107 |
-
|
108 |
-
leaderboard_data
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
109 |
column_config={"Model": st.column_config.LinkColumn("Model")},
|
110 |
-
hide_index=False,
|
111 |
)
|
112 |
else:
|
113 |
st.write("No data found to display on leaderboard.")
|
|
|
19 |
request_file = Path("user_request/") / f"data_{uuid.uuid4()}.json"
|
20 |
request_folder = request_file.parent
|
21 |
|
22 |
+
# Column order for the leaderboard table. This list is passed as
# ``column_order`` to ``st.data_editor`` when the leaderboard is rendered.
columns = [
    "eval_name",
    "Model",
    "Type",
    "Average ⬆️",
    "IFEval",
    "MMLU-PRO",
    "GPQA",
    "MUSR",
    "CO₂ cost (kg)",
]
|
34 |
+
|
35 |
scheduler = CommitScheduler(
|
36 |
repo_id="iberbench/ivace-user-request",
|
37 |
repo_type="dataset",
|
|
|
65 |
@st.cache_data
|
66 |
def load_data() -> pd.DataFrame:
|
67 |
try:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
68 |
data = (
|
69 |
load_dataset("open-llm-leaderboard/contents")["train"]
|
70 |
.to_pandas()
|
|
|
74 |
data["Model"] = data["Model"].apply(get_url)
|
75 |
data.sort_values(by="Average ⬆️", ascending=False, inplace=True)
|
76 |
data.reset_index(drop=True, inplace=True)
|
77 |
+
# add column to apply filtering
|
78 |
+
data["Active"] = False
|
79 |
+
|
80 |
return data
|
81 |
except FileNotFoundError:
|
82 |
st.error("open-llm-leaderboard/contents was not found in the hub")
|
83 |
return pd.DataFrame()
|
84 |
|
85 |
|
86 |
+
# functions to create filter
|
87 |
+
def active_data() -> pd.DataFrame:
    """Return a copy of the leaderboard rows currently flagged as active.

    Reads the frame stored under ``st.session_state["leaderboard_data"]`` and
    keeps only the rows whose boolean ``Active`` column is set. The result is
    a copy, so modifying it does not touch the session-state frame.
    """
    frame = st.session_state["leaderboard_data"]
    # ``Active`` is a boolean column, so it serves directly as the row mask.
    return frame[frame["Active"]].copy()
|
90 |
+
|
91 |
+
|
92 |
+
def get_index(row: int) -> int:
    """Return the index label of the active row at position *row*.

    ``row`` is a zero-based position within the frame returned by
    ``active_data()``. The returned value is that row's index label, which
    also identifies the row in the unfiltered session-state frame (the frame
    is given a default integer index when it is loaded).

    Raises:
        IndexError: if *row* is outside the range of active rows.
    """
    # Read the label straight from the index instead of building a row Series.
    return active_data().index[row]
|
95 |
+
|
96 |
+
|
97 |
+
def commit() -> None:
    """Write pending data-editor edits back into the session-state frame.

    Reads ``st.session_state.editor["edited_rows"]``, a mapping of row
    position to ``{column: new_value}``. Each position is translated to its
    index label with ``get_index`` and the new values are stored in
    ``st.session_state["leaderboard_data"]``.
    """
    edited_rows = st.session_state.editor["edited_rows"]
    for position, changes in edited_rows.items():
        # Positions refer to the filtered (active) view, so map them back to
        # the label used by the full frame before writing.
        row_index = get_index(position)
        for column, value in changes.items():
            st.session_state["leaderboard_data"].at[row_index, column] = value
|
103 |
+
|
104 |
+
|
105 |
# streamlit UI
leaderboard_data = load_data()
# Store the loaded frame in session state only when the key is missing; the
# filtering and editing code reads and updates the session-state frame.
if "leaderboard_data" not in st.session_state:
    st.session_state["leaderboard_data"] = leaderboard_data

# Two tabs: the leaderboard table and the model submission form.
tabs = st.tabs(["Leaderboard", "Submit model"])
|
111 |
|
112 |
with tabs[0]:
|
|
|
128 |
""",
|
129 |
unsafe_allow_html=True,
|
130 |
)
|
131 |
+
|
132 |
+
if not st.session_state["leaderboard_data"].empty:
    # ``commit`` runs when the search text changes, so pending editor edits
    # are written back before the set of visible rows is recomputed.
    name = st.text_input("Search for ...", on_change=commit)
    board = st.session_state["leaderboard_data"]
    if name == "":
        # Empty search: every row is shown.
        board["Active"] = True
    else:
        # Plain, case-insensitive substring match. ``regex=False`` keeps input
        # such as "(" or "+" from being parsed as a regular expression, and
        # ``na=False`` treats rows with a missing Model value as non-matching.
        board["Active"] = board["Model"].str.contains(
            name, case=False, regex=False, na=False
        )

    edited_data = st.data_editor(
        active_data(),
        column_order=columns,
        key="editor",
        hide_index=False,
        column_config={"Model": st.column_config.LinkColumn("Model")},
    )
else:
    st.write("No data found to display on leaderboard.")
|