nm-research committed on
Commit
4000b0e
·
verified ·
1 Parent(s): 4443575

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +4 -4
README.md CHANGED
@@ -218,7 +218,7 @@ evalplus.evaluate \
218
  </thead>
219
  <tbody>
220
  <tr>
221
- <td rowspan="7"><b>OpenLLM v1</b></td>
222
  <td>ARC-Challenge (Acc-Norm, 25-shot)</td>
223
  <td>55.63</td>
224
  <td>54.18</td>
@@ -261,7 +261,7 @@ evalplus.evaluate \
261
  <td><b>99.29</b></td>
262
  </tr>
263
  <tr>
264
- <td rowspan="7"><b>OpenLLM v2</b></td>
265
  <td>IFEval (Inst Level Strict Acc, 0-shot)</td>
266
  <td>67.99</td>
267
  <td>67.63</td>
@@ -304,11 +304,11 @@ evalplus.evaluate \
304
  <td><b>99.84</b></td>
305
  </tr>
306
  <tr>
307
- <td rowspan="2"><b>HumanEval</b></td>
308
  <td>HumanEval Pass@1</td>
309
  <td>53.40</td>
310
  <td>52.30</td>
311
- <td>97.94</td>
312
  </tr>
313
  </tbody>
314
  </table>
 
218
  </thead>
219
  <tbody>
220
  <tr>
221
+ <td rowspan="7"><b>OpenLLM V1</b></td>
222
  <td>ARC-Challenge (Acc-Norm, 25-shot)</td>
223
  <td>55.63</td>
224
  <td>54.18</td>
 
261
  <td><b>99.29</b></td>
262
  </tr>
263
  <tr>
264
+ <td rowspan="7"><b>OpenLLM V2</b></td>
265
  <td>IFEval (Inst Level Strict Acc, 0-shot)</td>
266
  <td>67.99</td>
267
  <td>67.63</td>
 
304
  <td><b>99.84</b></td>
305
  </tr>
306
  <tr>
307
+ <td rowspan="2"><b>Coding</b></td>
308
  <td>HumanEval Pass@1</td>
309
  <td>53.40</td>
310
  <td>52.30</td>
311
+ <td><b>97.94</b></td>
312
  </tr>
313
  </tbody>
314
  </table>