Spaces:
Running
Running
Upload folder using huggingface_hub
Browse files
- app/draw_diagram.py +1 -0
- app/pages.py +27 -9
app/draw_diagram.py
CHANGED
@@ -341,6 +341,7 @@ def draw_only_acc(folder_name, category_one, category_two, sorted):
|
|
341 |
.stMultiSelect [data-baseweb=select] span{
|
342 |
max-width: 800px;
|
343 |
font-size: 0.9rem;
|
|
|
344 |
}
|
345 |
</style>
|
346 |
""", unsafe_allow_html=True)
|
|
|
341 |
.stMultiSelect [data-baseweb=select] span{
|
342 |
max-width: 800px;
|
343 |
font-size: 0.9rem;
|
344 |
+
color: blue; /* Change text color of selected options */
|
345 |
}
|
346 |
</style>
|
347 |
""", unsafe_allow_html=True)
|
app/pages.py
CHANGED
@@ -15,7 +15,7 @@ def dashboard():
|
|
15 |
seaeval_url = "https://seaeval.github.io/"
|
16 |
|
17 |
st.divider()
|
18 |
-
st.markdown("#### What is [SeaEval](%s)" % seaeval_url)
|
19 |
|
20 |
with st.container():
|
21 |
left_co, cent_co,last_co = st.columns(3)
|
@@ -26,7 +26,7 @@ def dashboard():
|
|
26 |
st.markdown('''
|
27 |
|
28 |
''')
|
29 |
-
st.markdown("##### A new benchmark for multilingual foundation
|
30 |
st.markdown(''':star: How models understand and reason with natural language?
|
31 |
:balloon: Languages: English, Chinese, Malay, Spainish, Indonedian, Vietnamese, Filipino.
|
32 |
''')
|
@@ -104,11 +104,15 @@ def cultural_reasoning():
|
|
104 |
st.title("Cultural Reasoning")
|
105 |
|
106 |
filters_levelone = ['Zero Shot', 'Few Shot']
|
107 |
-
filters_leveltwo = [
|
108 |
-
'SG EVAL V1 Cleaned',
|
109 |
'SG EVAL V2 MCQ',
|
110 |
'SG EVAL V2 Open Ended',
|
111 |
-
'
|
|
|
|
|
|
|
|
|
|
|
112 |
|
113 |
category_one_dict = {'Zero Shot': 'zero_shot',
|
114 |
'Few Shot': 'few_shot'}
|
@@ -132,7 +136,13 @@ def general_reasoning():
|
|
132 |
st.title("General Reasoning")
|
133 |
|
134 |
filters_levelone = ['Zero Shot', 'Few Shot']
|
135 |
-
filters_leveltwo = [
|
|
|
|
|
|
|
|
|
|
|
|
|
136 |
|
137 |
category_one_dict = {'Zero Shot': 'zero_shot',
|
138 |
'Few Shot': 'few_shot'}
|
@@ -158,7 +168,8 @@ def flores():
|
|
158 |
filters_leveltwo = ['Indonesian to English',
|
159 |
'Vitenamese to English',
|
160 |
'Chinese to English',
|
161 |
-
'Malay to English'
|
|
|
162 |
|
163 |
category_one_dict = {'Zero Shot': 'zero_shot',
|
164 |
'Few Shot': 'few_shot'}
|
@@ -182,7 +193,10 @@ def emotion():
|
|
182 |
st.title("Emotion")
|
183 |
|
184 |
filters_levelone = ['Zero Shot', 'Few Shot']
|
185 |
-
filters_leveltwo = [
|
|
|
|
|
|
|
186 |
|
187 |
category_one_dict = {'Zero Shot': 'zero_shot',
|
188 |
'Few Shot': 'few_shot'}
|
@@ -205,7 +219,11 @@ def dialogue():
|
|
205 |
st.title("Dialogue")
|
206 |
|
207 |
filters_levelone = ['Zero Shot', 'Few Shot']
|
208 |
-
filters_leveltwo = [
|
|
|
|
|
|
|
|
|
209 |
|
210 |
category_one_dict = {'Zero Shot': 'zero_shot',
|
211 |
'Few Shot': 'few_shot'}
|
|
|
15 |
seaeval_url = "https://seaeval.github.io/"
|
16 |
|
17 |
st.divider()
|
18 |
+
st.markdown("#### What is [SeaEval](%s)?" % seaeval_url)
|
19 |
|
20 |
with st.container():
|
21 |
left_co, cent_co,last_co = st.columns(3)
|
|
|
26 |
st.markdown('''
|
27 |
|
28 |
''')
|
29 |
+
st.markdown("##### A new benchmark for multilingual, multicultral foundation model evaluation consisting of 28 dataset as the core and keep expanding over time.")
|
30 |
st.markdown(''':star: How models understand and reason with natural language?
|
31 |
:balloon: Languages: English, Chinese, Malay, Spainish, Indonedian, Vietnamese, Filipino.
|
32 |
''')
|
|
|
104 |
st.title("Cultural Reasoning")
|
105 |
|
106 |
filters_levelone = ['Zero Shot', 'Few Shot']
|
107 |
+
filters_leveltwo = [
|
|
|
108 |
'SG EVAL V2 MCQ',
|
109 |
'SG EVAL V2 Open Ended',
|
110 |
+
'SG EVAL',
|
111 |
+
'SG EVAL V1 Cleaned',
|
112 |
+
'CN EVAL',
|
113 |
+
'PH EVAL',
|
114 |
+
'US EVAL'
|
115 |
+
]
|
116 |
|
117 |
category_one_dict = {'Zero Shot': 'zero_shot',
|
118 |
'Few Shot': 'few_shot'}
|
|
|
136 |
st.title("General Reasoning")
|
137 |
|
138 |
filters_levelone = ['Zero Shot', 'Few Shot']
|
139 |
+
filters_leveltwo = [
|
140 |
+
'MMLU',
|
141 |
+
'CMMLU',
|
142 |
+
'IndoMMLU',
|
143 |
+
'C Eval',
|
144 |
+
'ZBench',
|
145 |
+
]
|
146 |
|
147 |
category_one_dict = {'Zero Shot': 'zero_shot',
|
148 |
'Few Shot': 'few_shot'}
|
|
|
168 |
filters_leveltwo = ['Indonesian to English',
|
169 |
'Vitenamese to English',
|
170 |
'Chinese to English',
|
171 |
+
'Malay to English'
|
172 |
+
]
|
173 |
|
174 |
category_one_dict = {'Zero Shot': 'zero_shot',
|
175 |
'Few Shot': 'few_shot'}
|
|
|
193 |
st.title("Emotion")
|
194 |
|
195 |
filters_levelone = ['Zero Shot', 'Few Shot']
|
196 |
+
filters_leveltwo = [
|
197 |
+
'Indonesian Emotion Classification',
|
198 |
+
'SST2',
|
199 |
+
]
|
200 |
|
201 |
category_one_dict = {'Zero Shot': 'zero_shot',
|
202 |
'Few Shot': 'few_shot'}
|
|
|
219 |
st.title("Dialogue")
|
220 |
|
221 |
filters_levelone = ['Zero Shot', 'Few Shot']
|
222 |
+
filters_leveltwo = [
|
223 |
+
'DREAM',
|
224 |
+
'SAMSum',
|
225 |
+
'DialogSum',
|
226 |
+
]
|
227 |
|
228 |
category_one_dict = {'Zero Shot': 'zero_shot',
|
229 |
'Few Shot': 'few_shot'}
|