Update README.md
Browse files
README.md
CHANGED
@@ -197,7 +197,7 @@ lm_eval --model hf --model_args pretrained=pytorch/Phi-4-mini-instruct-float8dq
|
|
197 |
| | Phi-4 mini-Ins | phi4-mini-float8dq |
|
198 |
| **Popular aggregated benchmark** | | |
|
199 |
| mmlu (0-shot) | 66.73 | 66.61 |
|
200 |
-
| mmlu_pro (5-shot) | 46.43 |
|
201 |
| **Reasoning** | | |
|
202 |
| arc_challenge (0-shot) | 56.91 | 56.66 |
|
203 |
| gpqa_main_zeroshot | 30.13 | 29.46 |
|
@@ -212,7 +212,7 @@ lm_eval --model hf --model_args pretrained=pytorch/Phi-4-mini-instruct-float8dq
|
|
212 |
| **Math** | | |
|
213 |
| gsm8k (5-shot) | 81.88 | 80.89 |
|
214 |
| mathqa (0-shot) | 42.31 | 42.51 |
|
215 |
-
| **Overall** | **55.35** | **
|
216 |
|
217 |
# Peak Memory Usage
|
218 |
|
|
|
197 |
| | Phi-4 mini-Ins | phi4-mini-float8dq |
|
198 |
| **Popular aggregated benchmark** | | |
|
199 |
| mmlu (0-shot) | 66.73 | 66.61 |
|
200 |
+
| mmlu_pro (5-shot) | 46.43 | 44.58 |
|
201 |
| **Reasoning** | | |
|
202 |
| arc_challenge (0-shot) | 56.91 | 56.66 |
|
203 |
| gpqa_main_zeroshot | 30.13 | 29.46 |
|
|
|
212 |
| **Math** | | |
|
213 |
| gsm8k (5-shot) | 81.88 | 80.89 |
|
214 |
| mathqa (0-shot) | 42.31 | 42.51 |
|
215 |
+
| **Overall** | **55.35** | **55.11** |
|
216 |
|
217 |
# Peak Memory Usage
|
218 |
|