diff --git a/.eval_results/gpqa.yaml b/.eval_results/gpqa.yaml new file mode 100644 index 0000000..a0fac2a --- /dev/null +++ b/.eval_results/gpqa.yaml @@ -0,0 +1,8 @@ +- dataset: + id: Idavidrein/gpqa + task_id: diamond + value: 81.7 + source: + url: https://huggingface.co/Qwen/Qwen3.5-9B + name: Model Card + user: SaylorTwift