Spaces:
Restarting
on
CPU Upgrade
Restarting
on
CPU Upgrade
poquad
Browse files
- src/about.py +3 -1
- src/display/utils.py +2 -1
src/about.py
CHANGED
@@ -40,7 +40,9 @@ class Tasks(Enum):
|
|
40 |
task25 = Task("polish_eq_bench_first_turn", "first_eqbench,none", "eq_bench_first_turn", "generate_until", 0.0)
|
41 |
task26 = Task("polish_eq_bench", "average_eqbench,none", "eq_bench", "generate_until", 0.0)
|
42 |
task20 = Task("polish_poleval2018_task3_test_10k", "word_perplexity,none", "poleval2018_task3_test_10k", "other")
|
43 |
-
|
|
|
|
|
44 |
|
45 |
|
46 |
g_tasks = [task.value.benchmark for task in Tasks if task.value.type == "generate_until"]
|
|
|
40 |
task25 = Task("polish_eq_bench_first_turn", "first_eqbench,none", "eq_bench_first_turn", "generate_until", 0.0)
|
41 |
task26 = Task("polish_eq_bench", "average_eqbench,none", "eq_bench", "generate_until", 0.0)
|
42 |
task20 = Task("polish_poleval2018_task3_test_10k", "word_perplexity,none", "poleval2018_task3_test_10k", "other")
|
43 |
+
task27 = Task("polish_poquad_reranking", "acc,none", "poquad_reranking", "other", 0.0)
|
44 |
+
task28 = Task("polish_abstractive_poquad_rag", "levenshtein,none", "abstractive_poquad_rag", "other", 0.0)
|
45 |
+
task29 = Task("polish_abstractive_poquad_open_book", "levenshtein,none", "abstractive_poquad_open_book", "other", 0.0)
|
46 |
|
47 |
|
48 |
g_tasks = [task.value.benchmark for task in Tasks if task.value.type == "generate_until"]
|
src/display/utils.py
CHANGED
@@ -37,7 +37,8 @@ auto_eval_column_dict.append(["average_mc", ColumnContent, ColumnContent("Avg mc
|
|
37 |
auto_eval_column_dict.append(["average_rag", ColumnContent, ColumnContent("Avg RAG", "number", True)])
|
38 |
|
39 |
for task in Tasks:
|
40 |
-
|
|
|
41 |
# Model information
|
42 |
|
43 |
auto_eval_column_dict.append(["model_type", ColumnContent, ColumnContent("Type", "str", False)])
|
|
|
37 |
auto_eval_column_dict.append(["average_rag", ColumnContent, ColumnContent("Avg RAG", "number", True)])
|
38 |
|
39 |
for task in Tasks:
|
40 |
+
show = task.value.benchmark not in ['polish_poquad_reranking','polish_abstractive_poquad_rag','polish_abstractive_poquad_open_book']  # hide these by default; compare the benchmark id, since task.name is the Enum member name (e.g. "task27") and would never match
|
41 |
+
auto_eval_column_dict.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "number", show)])
|
42 |
# Model information
|
43 |
|
44 |
auto_eval_column_dict.append(["model_type", ColumnContent, ColumnContent("Type", "str", False)])
|