wdevazelhes committed on
Commit
da5cd28
1 Parent(s): d34c453

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +5 -5
README.md CHANGED
@@ -158,7 +158,7 @@ Falcon3-7B is trained on 256 H100 nodes (world size 2048).
158
  <td rowspan="3">General</td>
159
  <td>MMLU (5-shot)</td>
160
  <td>31.1</td>
161
- <td>61</td>
162
  <td>50.2</td>
163
  <td>53.1</td>
164
  <td>42.5</td>
@@ -233,7 +233,7 @@ Falcon3-7B is trained on 256 H100 nodes (world size 2048).
233
  <td rowspan="4">CommonSense Understanding</td>
234
  <td>PIQA (0-shot)</td>
235
  <td>74.6</td>
236
- <td>76</td>
237
  <td>77.5</td>
238
  <td>79.2</td>
239
  <td>74.5</td>
@@ -249,7 +249,7 @@ Falcon3-7B is trained on 256 H100 nodes (world size 2048).
249
  <tr>
250
  <td>Winogrande (0-shot)</td>
251
  <td>60.4</td>
252
- <td>63</td>
253
  <td>66.1</td>
254
  <td>68.6</td>
255
  <td>61.2</td>
@@ -258,9 +258,9 @@ Falcon3-7B is trained on 256 H100 nodes (world size 2048).
258
  <td>OpenbookQA (0-shot)</td>
259
  <td>37.4</td>
260
  <td>40.4</td>
261
- <td>44</td>
262
  <td>41.8</td>
263
- <td>41</td>
264
  </tr>
265
  </tbody>
266
  </table>
 
158
  <td rowspan="3">General</td>
159
  <td>MMLU (5-shot)</td>
160
  <td>31.1</td>
161
+ <td>61.0</td>
162
  <td>50.2</td>
163
  <td>53.1</td>
164
  <td>42.5</td>
 
233
  <td rowspan="4">CommonSense Understanding</td>
234
  <td>PIQA (0-shot)</td>
235
  <td>74.6</td>
236
+ <td>76.0</td>
237
  <td>77.5</td>
238
  <td>79.2</td>
239
  <td>74.5</td>
 
249
  <tr>
250
  <td>Winogrande (0-shot)</td>
251
  <td>60.4</td>
252
+ <td>63.0</td>
253
  <td>66.1</td>
254
  <td>68.6</td>
255
  <td>61.2</td>
 
258
  <td>OpenbookQA (0-shot)</td>
259
  <td>37.4</td>
260
  <td>40.4</td>
261
+ <td>44.0</td>
262
  <td>41.8</td>
263
+ <td>41.0</td>
264
  </tr>
265
  </tbody>
266
  </table>