Update README.md
Browse files
README.md
CHANGED
|
@@ -197,7 +197,7 @@ lm_eval --model hf --model_args pretrained=pytorch/Phi-4-mini-instruct-float8dq
|
|
| 197 |
| | Phi-4 mini-Ins | phi4-mini-float8dq |
|
| 198 |
| **Popular aggregated benchmark** | | |
|
| 199 |
| mmlu (0-shot) | 66.73 | 66.61 |
|
| 200 |
-
| mmlu_pro (5-shot) | 46.43 |
|
| 201 |
| **Reasoning** | | |
|
| 202 |
| arc_challenge (0-shot) | 56.91 | 56.66 |
|
| 203 |
| gpqa_main_zeroshot | 30.13 | 29.46 |
|
|
@@ -212,7 +212,7 @@ lm_eval --model hf --model_args pretrained=pytorch/Phi-4-mini-instruct-float8dq
|
|
| 212 |
| **Math** | | |
|
| 213 |
| gsm8k (5-shot) | 81.88 | 80.89 |
|
| 214 |
| mathqa (0-shot) | 42.31 | 42.51 |
|
| 215 |
-
| **Overall** | **55.35** | **
|
| 216 |
|
| 217 |
# Peak Memory Usage
|
| 218 |
|
|
|
|
| 197 |
| | Phi-4 mini-Ins | phi4-mini-float8dq |
|
| 198 |
| **Popular aggregated benchmark** | | |
|
| 199 |
| mmlu (0-shot) | 66.73 | 66.61 |
|
| 200 |
+
| mmlu_pro (5-shot) | 46.43 | 44.58 |
|
| 201 |
| **Reasoning** | | |
|
| 202 |
| arc_challenge (0-shot) | 56.91 | 56.66 |
|
| 203 |
| gpqa_main_zeroshot | 30.13 | 29.46 |
|
|
|
|
| 212 |
| **Math** | | |
|
| 213 |
| gsm8k (5-shot) | 81.88 | 80.89 |
|
| 214 |
| mathqa (0-shot) | 42.31 | 42.51 |
|
| 215 |
+
| **Overall** | **55.35** | **55.11** |
|
| 216 |
|
| 217 |
# Peak Memory Usage
|
| 218 |
|