Update README.md (#3)
Browse files
- Update README.md (da5cd28c7a09915250c732fa28b8bb9e8fab3cd3)
Co-authored-by: William de Vazelhes <[email protected]>
README.md
CHANGED
|
@@ -158,7 +158,7 @@ Falcon3-7B is trained on 256 H100 nodes (world size 2048).
|
|
| 158 |
<td rowspan="3">General</td>
|
| 159 |
<td>MMLU (5-shot)</td>
|
| 160 |
<td>31.1</td>
|
| 161 |
-
<td>61</td>
|
| 162 |
<td>50.2</td>
|
| 163 |
<td>53.1</td>
|
| 164 |
<td>42.5</td>
|
|
@@ -233,7 +233,7 @@ Falcon3-7B is trained on 256 H100 nodes (world size 2048).
|
|
| 233 |
<td rowspan="4">CommonSense Understanding</td>
|
| 234 |
<td>PIQA (0-shot)</td>
|
| 235 |
<td>74.6</td>
|
| 236 |
-
<td>76</td>
|
| 237 |
<td>77.5</td>
|
| 238 |
<td>79.2</td>
|
| 239 |
<td>74.5</td>
|
|
@@ -249,7 +249,7 @@ Falcon3-7B is trained on 256 H100 nodes (world size 2048).
|
|
| 249 |
<tr>
|
| 250 |
<td>Winogrande (0-shot)</td>
|
| 251 |
<td>60.4</td>
|
| 252 |
-
<td>63</td>
|
| 253 |
<td>66.1</td>
|
| 254 |
<td>68.6</td>
|
| 255 |
<td>61.2</td>
|
|
@@ -258,9 +258,9 @@ Falcon3-7B is trained on 256 H100 nodes (world size 2048).
|
|
| 258 |
<td>OpenbookQA (0-shot)</td>
|
| 259 |
<td>37.4</td>
|
| 260 |
<td>40.4</td>
|
| 261 |
-
<td>44</td>
|
| 262 |
<td>41.8</td>
|
| 263 |
-
<td>41</td>
|
| 264 |
</tr>
|
| 265 |
</tbody>
|
| 266 |
</table>
|
|
|
|
| 158 |
<td rowspan="3">General</td>
|
| 159 |
<td>MMLU (5-shot)</td>
|
| 160 |
<td>31.1</td>
|
| 161 |
+
<td>61.0</td>
|
| 162 |
<td>50.2</td>
|
| 163 |
<td>53.1</td>
|
| 164 |
<td>42.5</td>
|
|
|
|
| 233 |
<td rowspan="4">CommonSense Understanding</td>
|
| 234 |
<td>PIQA (0-shot)</td>
|
| 235 |
<td>74.6</td>
|
| 236 |
+
<td>76.0</td>
|
| 237 |
<td>77.5</td>
|
| 238 |
<td>79.2</td>
|
| 239 |
<td>74.5</td>
|
|
|
|
| 249 |
<tr>
|
| 250 |
<td>Winogrande (0-shot)</td>
|
| 251 |
<td>60.4</td>
|
| 252 |
+
<td>63.0</td>
|
| 253 |
<td>66.1</td>
|
| 254 |
<td>68.6</td>
|
| 255 |
<td>61.2</td>
|
|
|
|
| 258 |
<td>OpenbookQA (0-shot)</td>
|
| 259 |
<td>37.4</td>
|
| 260 |
<td>40.4</td>
|
| 261 |
+
<td>44.0</td>
|
| 262 |
<td>41.8</td>
|
| 263 |
+
<td>41.0</td>
|
| 264 |
</tr>
|
| 265 |
</tbody>
|
| 266 |
</table>
|