diff --git a/.eval_results/mmlu_pro.yaml b/.eval_results/mmlu_pro.yaml new file mode 100644 index 0000000..3542341 --- /dev/null +++ b/.eval_results/mmlu_pro.yaml @@ -0,0 +1,8 @@ +- dataset: + id: TIGER-Lab/MMLU-Pro + task_id: mmlu_pro + value: 82.5 + source: + url: https://huggingface.co/Qwen/Qwen3.5-9B + name: Model Card + user: SaylorTwift