Upload 10 files
Browse files
- scripts/get_scores.py +7 -5
- scripts/helper.py +1 -1
- scripts/process_data.py +0 -1
scripts/get_scores.py
CHANGED
@@ -93,6 +93,8 @@ def load_negative_rejection_scores(config):
|
|
93 |
return df
|
94 |
|
95 |
def load_counterfactual_robustness_scores(config):
|
|
|
|
|
96 |
if not os.path.exists(Counterfactual_Robustness_DIR):
|
97 |
return pd.DataFrame(columns=["Model", "Accuracy with factual docs (%)", "Error Detection Rate", "Correction Rate (%)"])
|
98 |
|
@@ -109,14 +111,14 @@ def load_counterfactual_robustness_scores(config):
|
|
109 |
with open(filepath, "r") as f:
|
110 |
score = json.load(f)
|
111 |
score_data[model] = {
|
112 |
-
"Accuracy with factual docs (%)":
|
113 |
-
"Error Detection Rate":
|
114 |
"Correction Rate (%)": round(score.get("correct_rate", 0) * 100, 2) # 2 decimal places
|
115 |
}
|
116 |
else:
|
117 |
score_data[model] = { # Populate with "N/A" if file not found
|
118 |
"Accuracy with factual docs (%)": "N/A",
|
119 |
-
"Error Detection Rate": "N/A",
|
120 |
"Correction Rate (%)": "N/A"
|
121 |
}
|
122 |
|
@@ -124,8 +126,8 @@ def load_counterfactual_robustness_scores(config):
|
|
124 |
df = pd.DataFrame([
|
125 |
{
|
126 |
"Model": model,
|
127 |
-
"Accuracy with factual docs (%)": score_data[model]["Accuracy with factual docs (%)"],
|
128 |
-
"Error Detection Rate": score_data[model]["Error Detection Rate"],
|
129 |
"Correction Rate (%)": f"{score_data[model]['Correction Rate (%)']:.2f}" if score_data[model]["Correction Rate (%)"] != "N/A" else "N/A"
|
130 |
}
|
131 |
for model in config["models"]
|
|
|
93 |
return df
|
94 |
|
95 |
def load_counterfactual_robustness_scores(config):
|
96 |
+
#hard code noise rate to 0.4
|
97 |
+
config['noise_rate'] = 0.4
|
98 |
if not os.path.exists(Counterfactual_Robustness_DIR):
|
99 |
return pd.DataFrame(columns=["Model", "Accuracy with factual docs (%)", "Error Detection Rate", "Correction Rate (%)"])
|
100 |
|
|
|
111 |
with open(filepath, "r") as f:
|
112 |
score = json.load(f)
|
113 |
score_data[model] = {
|
114 |
+
"Accuracy with factual docs (%)": round(score.get("all_rate", 0) * 100, 2), # No decimal
|
115 |
+
"Error Detection Rate (%)": round(score.get("reject_rate", 0) * 100, 2),
|
116 |
"Correction Rate (%)": round(score.get("correct_rate", 0) * 100, 2) # 2 decimal places
|
117 |
}
|
118 |
else:
|
119 |
score_data[model] = { # Populate with "N/A" if file not found
|
120 |
"Accuracy with factual docs (%)": "N/A",
|
121 |
+
"Error Detection Rate (%)": "N/A",
|
122 |
"Correction Rate (%)": "N/A"
|
123 |
}
|
124 |
|
|
|
126 |
df = pd.DataFrame([
|
127 |
{
|
128 |
"Model": model,
|
129 |
+
"Accuracy with factual docs (%)": f"{score_data[model]['Accuracy with factual docs (%)']:.2f}" if score_data[model]["Accuracy with factual docs (%)"] != "N/A" else "N/A",
|
130 |
+
"Error Detection Rate": f"{score_data[model]['Error Detection Rate (%)']:.2f}" if score_data[model]["Error Detection Rate (%)"] != "N/A" else "N/A",
|
131 |
"Correction Rate (%)": f"{score_data[model]['Correction Rate (%)']:.2f}" if score_data[model]["Correction Rate (%)"] != "N/A" else "N/A"
|
132 |
}
|
133 |
for model in config["models"]
|
scripts/helper.py
CHANGED
@@ -81,7 +81,7 @@ def initialize_logging():
|
|
81 |
|
82 |
def get_logs():
|
83 |
"""Retrieve logs for display."""
|
84 |
-
return "\n".join(logs[-
|
85 |
|
86 |
def load_used_data(filepath):
|
87 |
"""Loads existing processed data to avoid redundant evaluations."""
|
|
|
81 |
|
82 |
def get_logs():
|
83 |
"""Retrieve logs for display."""
|
84 |
+
return "\n".join(logs[-1000:])
|
85 |
|
86 |
def load_used_data(filepath):
|
87 |
"""Loads existing processed data to avoid redundant evaluations."""
|
scripts/process_data.py
CHANGED
@@ -3,7 +3,6 @@ import random
|
|
3 |
import math
|
4 |
|
5 |
def process_data(instance, noise_rate, passage_num, filename, correct_rate=0):
|
6 |
-
print(filename)
|
7 |
"""Process the data for generating a noisy document set."""
|
8 |
query = instance['query']
|
9 |
ans = instance['answer']
|
|
|
3 |
import math
|
4 |
|
5 |
def process_data(instance, noise_rate, passage_num, filename, correct_rate=0):
|
|
|
6 |
"""Process the data for generating a noisy document set."""
|
7 |
query = instance['query']
|
8 |
ans = instance['answer']
|