Add GPQA Diamond evaluation result

This commit is contained in:
Nathan Habib 2026-03-02 13:35:24 +00:00 committed by system
parent 92725404d2
commit 7daa976d0c
No known key found for this signature in database
GPG Key ID: 6A528E38E0733467

8
.eval_results/gpqa.yaml Normal file

@@ -0,0 +1,8 @@
- dataset:
    id: Idavidrein/gpqa
    task_id: diamond
  value: 81.7
  source:
    url: https://huggingface.co/Qwen/Qwen3.5-9B
    name: Model Card
    user: SaylorTwift