Upload 6 files
Browse files- results/Noise Robustness/prediction_qwen-2.5-32b_noise_0.4_passage_5.json +0 -0
- results/Noise Robustness/prediction_qwen-2.5-32b_noise_0.6_passage_5.json +0 -0
- results/Noise Robustness/prediction_qwen-2.5-32b_noise_0.8_passage_5.json +0 -0
- results/Noise Robustness/scores_qwen-2.5-32b_noise_0.4_passage_5.json +4 -4
- results/Noise Robustness/scores_qwen-2.5-32b_noise_0.6_passage_5.json +4 -4
- results/Noise Robustness/scores_qwen-2.5-32b_noise_0.8_passage_5.json +9 -0
results/Noise Robustness/prediction_qwen-2.5-32b_noise_0.4_passage_5.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
results/Noise Robustness/prediction_qwen-2.5-32b_noise_0.6_passage_5.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
results/Noise Robustness/prediction_qwen-2.5-32b_noise_0.8_passage_5.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
results/Noise Robustness/scores_qwen-2.5-32b_noise_0.4_passage_5.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"model": "qwen-2.5-32b",
|
3 |
-
"accuracy": 0
|
4 |
"noise_rate": 0.4,
|
5 |
-
"correct_count":
|
6 |
"total": 50,
|
7 |
-
"all_rate": 0
|
8 |
-
"tt":
|
9 |
}
|
|
|
1 |
{
|
2 |
"model": "qwen-2.5-32b",
|
3 |
+
"accuracy": 1.0,
|
4 |
"noise_rate": 0.4,
|
5 |
+
"correct_count": 50,
|
6 |
"total": 50,
|
7 |
+
"all_rate": 1.0,
|
8 |
+
"tt": 50
|
9 |
}
|
results/Noise Robustness/scores_qwen-2.5-32b_noise_0.6_passage_5.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"model": "qwen-2.5-32b",
|
3 |
-
"accuracy": 0.
|
4 |
"noise_rate": 0.6,
|
5 |
-
"correct_count":
|
6 |
"total": 50,
|
7 |
-
"all_rate": 0.
|
8 |
-
"tt":
|
9 |
}
|
|
|
1 |
{
|
2 |
"model": "qwen-2.5-32b",
|
3 |
+
"accuracy": 0.96,
|
4 |
"noise_rate": 0.6,
|
5 |
+
"correct_count": 48,
|
6 |
"total": 50,
|
7 |
+
"all_rate": 0.96,
|
8 |
+
"tt": 48
|
9 |
}
|
results/Noise Robustness/scores_qwen-2.5-32b_noise_0.8_passage_5.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model": "qwen-2.5-32b",
|
3 |
+
"accuracy": 0.9,
|
4 |
+
"noise_rate": 0.8,
|
5 |
+
"correct_count": 45,
|
6 |
+
"total": 50,
|
7 |
+
"all_rate": 0.9,
|
8 |
+
"tt": 45
|
9 |
+
}
|