wdevazelhes
committed on
Commit
•
da5cd28
1
Parent(s):
d34c453
Update README.md
Browse files
README.md
CHANGED
@@ -158,7 +158,7 @@ Falcon3-7B is trained on 256 H100 nodes (world size 2048).
|
|
158 |
<td rowspan="3">General</td>
|
159 |
<td>MMLU (5-shot)</td>
|
160 |
<td>31.1</td>
|
161 |
-
<td>61</td>
|
162 |
<td>50.2</td>
|
163 |
<td>53.1</td>
|
164 |
<td>42.5</td>
|
@@ -233,7 +233,7 @@ Falcon3-7B is trained on 256 H100 nodes (world size 2048).
|
|
233 |
<td rowspan="4">CommonSense Understanding</td>
|
234 |
<td>PIQA (0-shot)</td>
|
235 |
<td>74.6</td>
|
236 |
-
<td>76</td>
|
237 |
<td>77.5</td>
|
238 |
<td>79.2</td>
|
239 |
<td>74.5</td>
|
@@ -249,7 +249,7 @@ Falcon3-7B is trained on 256 H100 nodes (world size 2048).
|
|
249 |
<tr>
|
250 |
<td>Winogrande (0-shot)</td>
|
251 |
<td>60.4</td>
|
252 |
-
<td>63</td>
|
253 |
<td>66.1</td>
|
254 |
<td>68.6</td>
|
255 |
<td>61.2</td>
|
@@ -258,9 +258,9 @@ Falcon3-7B is trained on 256 H100 nodes (world size 2048).
|
|
258 |
<td>OpenbookQA (0-shot)</td>
|
259 |
<td>37.4</td>
|
260 |
<td>40.4</td>
|
261 |
-
<td>44</td>
|
262 |
<td>41.8</td>
|
263 |
-
<td>41</td>
|
264 |
</tr>
|
265 |
</tbody>
|
266 |
</table>
|
|
|
158 |
<td rowspan="3">General</td>
|
159 |
<td>MMLU (5-shot)</td>
|
160 |
<td>31.1</td>
|
161 |
+
<td>61.0</td>
|
162 |
<td>50.2</td>
|
163 |
<td>53.1</td>
|
164 |
<td>42.5</td>
|
|
|
233 |
<td rowspan="4">CommonSense Understanding</td>
|
234 |
<td>PIQA (0-shot)</td>
|
235 |
<td>74.6</td>
|
236 |
+
<td>76.0</td>
|
237 |
<td>77.5</td>
|
238 |
<td>79.2</td>
|
239 |
<td>74.5</td>
|
|
|
249 |
<tr>
|
250 |
<td>Winogrande (0-shot)</td>
|
251 |
<td>60.4</td>
|
252 |
+
<td>63.0</td>
|
253 |
<td>66.1</td>
|
254 |
<td>68.6</td>
|
255 |
<td>61.2</td>
|
|
|
258 |
<td>OpenbookQA (0-shot)</td>
|
259 |
<td>37.4</td>
|
260 |
<td>40.4</td>
|
261 |
+
<td>44.0</td>
|
262 |
<td>41.8</td>
|
263 |
+
<td>41.0</td>
|
264 |
</tr>
|
265 |
</tbody>
|
266 |
</table>
|