Midm-LLM committed on
Commit
4262742
·
verified ·
1 Parent(s): 01af797

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +47 -47
README.md CHANGED
@@ -178,20 +178,20 @@ print(tokenizer.decode(output[0]))
178
  <td align="center">42.4</td>
179
  <td align="center">43.0</td>
180
  <td align="center">65.4</td>
181
- <td align="center"><u>74.0</u></td>
182
  <td align="center">68.9</td>
183
  </tr>
184
  <tr>
185
  <td><strong>Mi:dm 2.0-Mini-inst</strong></td>
186
- <td align="center"><u>66.4</u></td>
187
  <td align="center">61.4</td>
188
  <td align="center">36.7</td>
189
- <td align="center"><u>70.8</u></td>
190
  <td align="center">58.8</td>
191
  <td align="center">45.1</td>
192
  <td align="center">42.4</td>
193
  <td align="center">43.8</td>
194
- <td align="center"><u>73.3</u></td>
195
  <td align="center"><strong>74.0</strong></td>
196
  <td align="center"><strong>73.6</strong></td>
197
  </tr>
@@ -202,17 +202,17 @@ print(tokenizer.decode(output[0]))
202
  <!-- Large Models -->
203
  <tr>
204
  <td><strong>Qwen3-14B</strong></td>
205
- <td align="center"><u>72.4</u></td>
206
  <td align="center">65.7</td>
207
- <td align="center"><u>49.8</u></td>
208
  <td align="center">68.4</td>
209
  <td align="center">64.1</td>
210
- <td align="center"><u>55.4</u></td>
211
- <td align="center"><u>54.7</u></td>
212
- <td align="center"><u>55.1</u></td>
213
  <td align="center"><strong>83.6</strong></td>
214
  <td align="center">71</td>
215
- <td align="center"><u>77.3</u></td>
216
  </tr>
217
  <tr>
218
  <td><strong>Llama-3.1-8B-inst</strong></td>
@@ -231,15 +231,15 @@ print(tokenizer.decode(output[0]))
231
  <tr>
232
  <td><strong>Exaone-3.5-7.8B-inst</strong></td>
233
  <td align="center">71.6</td>
234
- <td align="center"><u>69.3</u></td>
235
  <td align="center">46.9</td>
236
- <td align="center"><u>72.9</u></td>
237
- <td align="center"><u>65.2</u></td>
238
  <td align="center">52.6</td>
239
  <td align="center">45.6</td>
240
  <td align="center">49.1</td>
241
  <td align="center">69.1</td>
242
- <td align="center"><u>79.6</u></td>
243
  <td align="center">74.4</td>
244
  </tr>
245
  <tr>
@@ -252,7 +252,7 @@ print(tokenizer.decode(output[0]))
252
  <td align="center"><strong>57.3</strong></td>
253
  <td align="center"><strong>58.0</strong></td>
254
  <td align="center"><strong>57.7</strong></td>
255
- <td align="center"><u>82</u></td>
256
  <td align="center"><strong>89.7</strong></td>
257
  <td align="center"><strong>85.9</strong></td>
258
  </tr>
@@ -296,9 +296,9 @@ print(tokenizer.decode(output[0]))
296
  <td><strong>Exaone-3.5-2.4B-inst</strong></td>
297
  <td align="center">68.7</td>
298
  <td align="center"><strong>58.5</strong></td>
299
- <td align="center"><u>87.2</u></td>
300
  <td align="center">38.0</td>
301
- <td align="center"><u>62.5</u></td>
302
  <td align="center">60.3</td>
303
  <td align="center">64.1</td>
304
  <td align="center">7.4</td>
@@ -312,11 +312,11 @@ print(tokenizer.decode(output[0]))
312
  <td align="center">80.5</td>
313
  <td align="center">42.5</td>
314
  <td align="center">61.9</td>
315
- <td align="center"><u>61.7</u></td>
316
- <td align="center"><u>64.5</u></td>
317
  <td align="center"><strong>7.7</strong></td>
318
- <td align="center"><u>39.9</u></td>
319
- <td align="center"><u>37.4</u></td>
320
  </tr>
321
 
322
  <!-- Visual Spacer -->
@@ -351,9 +351,9 @@ print(tokenizer.decode(output[0]))
351
  </tr>
352
  <tr>
353
  <td><strong>Exaone-3.5-7.8B-inst</strong></td>
354
- <td align="center"><u>73.5</u></td>
355
- <td align="center"><u>61.9</u></td>
356
- <td align="center"><u>92.0</u></td>
357
  <td align="center">44.0</td>
358
  <td align="center">67.2</td>
359
  <td align="center">64.6</td>
@@ -364,16 +364,16 @@ print(tokenizer.decode(output[0]))
364
  </tr>
365
  <tr>
366
  <td><strong>Mi:dm 2.0-Base-inst</strong></td>
367
- <td align="center"><u>86.5</u></td>
368
- <td align="center"><u>70.8</u></td>
369
  <td align="center"><strong>95.2</strong></td>
370
  <td align="center"><strong>53.0</strong></td>
371
- <td align="center"><u>76.1</u></td>
372
- <td align="center"><u>75.1</u></td>
373
- <td align="center"><u>73.0</u></td>
374
  <td align="center"><strong>8.6</strong></td>
375
- <td align="center"><u>52.9</u></td>
376
- <td align="center"><u>44.8</u></td>
377
  </tr>
378
  </table>
379
 
@@ -410,13 +410,13 @@ print(tokenizer.decode(output[0]))
410
  <!-- Small Models -->
411
  <tr>
412
  <td><strong>Qwen3-4B</strong></td>
413
- <td align="center"><u>79.7</u></td>
414
  <td align="center"><strong>79.0</strong></td>
415
- <td align="center"><u>39.8</u></td>
416
  <td align="center"><strong>58.5</strong></td>
417
  <td align="center"><strong>59.1</strong></td>
418
  <td align="center"><strong>90.4</strong></td>
419
- <td align="center"><u>62.4</u></td>
420
  <td align="center">-</td>
421
  <td align="center"><strong>73.3</strong></td>
422
  <td align="center"><strong>73.3</strong></td>
@@ -428,7 +428,7 @@ print(tokenizer.decode(output[0]))
428
  <td align="center">28.1</td>
429
  <td align="center">49.7</td>
430
  <td align="center">41.4</td>
431
- <td align="center"><u>82.5</u></td>
432
  <td align="center">59.8</td>
433
  <td align="center">-</td>
434
  <td align="center">59.5</td>
@@ -437,10 +437,10 @@ print(tokenizer.decode(output[0]))
437
  <tr>
438
  <td><strong>Mi:dm 2.0-Mini-inst</strong></td>
439
  <td align="center">73.6</td>
440
- <td align="center"><u>44.5</u></td>
441
  <td align="center">26.6</td>
442
- <td align="center"><u>51.7</u></td>
443
- <td align="center"><u>40.9</u></td>
444
  <td align="center">83.1</td>
445
  <td align="center"><strong>60.9</strong></td>
446
  <td align="center">-</td>
@@ -453,7 +453,7 @@ print(tokenizer.decode(output[0]))
453
  <!-- Large Models -->
454
  <tr>
455
  <td><strong>Qwen3-14B</strong></td>
456
- <td align="center"><u>83.9</u></td>
457
  <td align="center"><strong>83.4</strong></td>
458
  <td align="center"><strong>49.8</strong></td>
459
  <td align="center"><strong>57.7</strong></td>
@@ -467,23 +467,23 @@ print(tokenizer.decode(output[0]))
467
  <tr>
468
  <td><strong>Llama-3.1-8B-inst</strong></td>
469
  <td align="center">79.9</td>
470
- <td align="center"><u>60.3</u></td>
471
  <td align="center">21.6</td>
472
  <td align="center">50.3</td>
473
  <td align="center">44.1</td>
474
  <td align="center">81.2</td>
475
  <td align="center"><strong>81.8</strong></td>
476
  <td align="center">47.6</td>
477
- <td align="center"><u>70.7</u></td>
478
- <td align="center"><u>59.2</u></td>
479
  </tr>
480
  <tr>
481
  <td><strong>Exaone-3.5-7.8B-inst</strong></td>
482
  <td align="center">83.6</td>
483
  <td align="center">50.1</td>
484
- <td align="center"><u>33.1</u></td>
485
- <td align="center"><u>51.2</u></td>
486
- <td align="center"><u>44.8</u></td>
487
  <td align="center">81.1</td>
488
  <td align="center">79.4</td>
489
  <td align="center">40.7</td>
@@ -498,8 +498,8 @@ print(tokenizer.decode(output[0]))
498
  <td align="center">51.9</td>
499
  <td align="center">54.4</td>
500
  <td align="center"><strong>91.6</strong></td>
501
- <td align="center"><u>77.5</u></td>
502
- <td align="center"><u>53.3</u></td>
503
  <td align="center">73.7</td>
504
  <td align="center">63.5</td>
505
  </tr>
 
178
  <td align="center">42.4</td>
179
  <td align="center">43.0</td>
180
  <td align="center">65.4</td>
181
+ <td align="center"><strong>74.0</strong></td>
182
  <td align="center">68.9</td>
183
  </tr>
184
  <tr>
185
  <td><strong>Mi:dm 2.0-Mini-inst</strong></td>
186
+ <td align="center"><strong>66.4</strong></td>
187
  <td align="center">61.4</td>
188
  <td align="center">36.7</td>
189
+ <td align="center"><strong>70.8</strong></td>
190
  <td align="center">58.8</td>
191
  <td align="center">45.1</td>
192
  <td align="center">42.4</td>
193
  <td align="center">43.8</td>
194
+ <td align="center">73.3</td>
195
  <td align="center"><strong>74.0</strong></td>
196
  <td align="center"><strong>73.6</strong></td>
197
  </tr>
 
202
  <!-- Large Models -->
203
  <tr>
204
  <td><strong>Qwen3-14B</strong></td>
205
+ <td align="center">72.4</td>
206
  <td align="center">65.7</td>
207
+ <td align="center">49.8</td>
208
  <td align="center">68.4</td>
209
  <td align="center">64.1</td>
210
+ <td align="center">55.4</td>
211
+ <td align="center">54.7</td>
212
+ <td align="center">55.1</td>
213
  <td align="center"><strong>83.6</strong></td>
214
  <td align="center">71</td>
215
+ <td align="center">77.3</td>
216
  </tr>
217
  <tr>
218
  <td><strong>Llama-3.1-8B-inst</strong></td>
 
231
  <tr>
232
  <td><strong>Exaone-3.5-7.8B-inst</strong></td>
233
  <td align="center">71.6</td>
234
+ <td align="center">69.3</td>
235
  <td align="center">46.9</td>
236
+ <td align="center">72.9</td>
237
+ <td align="center">65.2</td>
238
  <td align="center">52.6</td>
239
  <td align="center">45.6</td>
240
  <td align="center">49.1</td>
241
  <td align="center">69.1</td>
242
+ <td align="center">79.6</td>
243
  <td align="center">74.4</td>
244
  </tr>
245
  <tr>
 
252
  <td align="center"><strong>57.3</strong></td>
253
  <td align="center"><strong>58.0</strong></td>
254
  <td align="center"><strong>57.7</strong></td>
255
+ <td align="center">82</td>
256
  <td align="center"><strong>89.7</strong></td>
257
  <td align="center"><strong>85.9</strong></td>
258
  </tr>
 
296
  <td><strong>Exaone-3.5-2.4B-inst</strong></td>
297
  <td align="center">68.7</td>
298
  <td align="center"><strong>58.5</strong></td>
299
+ <td align="center">87.2</td>
300
  <td align="center">38.0</td>
301
+ <td align="center">62.5</td>
302
  <td align="center">60.3</td>
303
  <td align="center">64.1</td>
304
  <td align="center">7.4</td>
 
312
  <td align="center">80.5</td>
313
  <td align="center">42.5</td>
314
  <td align="center">61.9</td>
315
+ <td align="center">61.7</td>
316
+ <td align="center">64.5</td>
317
  <td align="center"><strong>7.7</strong></td>
318
+ <td align="center">39.9</td>
319
+ <td align="center">37.4</td>
320
  </tr>
321
 
322
  <!-- Visual Spacer -->
 
351
  </tr>
352
  <tr>
353
  <td><strong>Exaone-3.5-7.8B-inst</strong></td>
354
+ <td align="center">73.5</td>
355
+ <td align="center">61.9</td>
356
+ <td align="center">92.0</td>
357
  <td align="center">44.0</td>
358
  <td align="center">67.2</td>
359
  <td align="center">64.6</td>
 
364
  </tr>
365
  <tr>
366
  <td><strong>Mi:dm 2.0-Base-inst</strong></td>
367
+ <td align="center">86.5</td>
368
+ <td align="center">70.8</td>
369
  <td align="center"><strong>95.2</strong></td>
370
  <td align="center"><strong>53.0</strong></td>
371
+ <td align="center">76.1</td>
372
+ <td align="center">75.1</td>
373
+ <td align="center">73.0</td>
374
  <td align="center"><strong>8.6</strong></td>
375
+ <td align="center">52.9</td>
376
+ <td align="center">44.8</td>
377
  </tr>
378
  </table>
379
 
 
410
  <!-- Small Models -->
411
  <tr>
412
  <td><strong>Qwen3-4B</strong></td>
413
+ <td align="center">79.7</td>
414
  <td align="center"><strong>79.0</strong></td>
415
+ <td align="center"><strong>39.8</strong></td>
416
  <td align="center"><strong>58.5</strong></td>
417
  <td align="center"><strong>59.1</strong></td>
418
  <td align="center"><strong>90.4</strong></td>
419
+ <td align="center">62.4</td>
420
  <td align="center">-</td>
421
  <td align="center"><strong>73.3</strong></td>
422
  <td align="center"><strong>73.3</strong></td>
 
428
  <td align="center">28.1</td>
429
  <td align="center">49.7</td>
430
  <td align="center">41.4</td>
431
+ <td align="center">82.5</td>
432
  <td align="center">59.8</td>
433
  <td align="center">-</td>
434
  <td align="center">59.5</td>
 
437
  <tr>
438
  <td><strong>Mi:dm 2.0-Mini-inst</strong></td>
439
  <td align="center">73.6</td>
440
+ <td align="center">44.5</td>
441
  <td align="center">26.6</td>
442
+ <td align="center">51.7</td>
443
+ <td align="center">40.9</td>
444
  <td align="center">83.1</td>
445
  <td align="center"><strong>60.9</strong></td>
446
  <td align="center">-</td>
 
453
  <!-- Large Models -->
454
  <tr>
455
  <td><strong>Qwen3-14B</strong></td>
456
+ <td align="center">83.9</td>
457
  <td align="center"><strong>83.4</strong></td>
458
  <td align="center"><strong>49.8</strong></td>
459
  <td align="center"><strong>57.7</strong></td>
 
467
  <tr>
468
  <td><strong>Llama-3.1-8B-inst</strong></td>
469
  <td align="center">79.9</td>
470
+ <td align="center">60.3</td>
471
  <td align="center">21.6</td>
472
  <td align="center">50.3</td>
473
  <td align="center">44.1</td>
474
  <td align="center">81.2</td>
475
  <td align="center"><strong>81.8</strong></td>
476
  <td align="center">47.6</td>
477
+ <td align="center">70.7</td>
478
+ <td align="center">59.2</td>
479
  </tr>
480
  <tr>
481
  <td><strong>Exaone-3.5-7.8B-inst</strong></td>
482
  <td align="center">83.6</td>
483
  <td align="center">50.1</td>
484
+ <td align="center">33.1</td>
485
+ <td align="center">51.2</td>
486
+ <td align="center">44.8</td>
487
  <td align="center">81.1</td>
488
  <td align="center">79.4</td>
489
  <td align="center">40.7</td>
 
498
  <td align="center">51.9</td>
499
  <td align="center">54.4</td>
500
  <td align="center"><strong>91.6</strong></td>
501
+ <td align="center">77.5</td>
502
+ <td align="center">53.3</td>
503
  <td align="center">73.7</td>
504
  <td align="center">63.5</td>
505
  </tr>