PeterKruger's picture
Upload 7 files
11b5f6a verified
raw
history blame contribute delete
373 Bytes
{
"run_id": "agro1_2025-12-10",
"title": "AutoBench Agronomy LLM Benchmark - December 2025",
"date": "2025-12-10",
"description": "The first AutoBench run for the Agronomy domain, with models including Gemini 3 Pro, GPT-5.1, Grok 4.1, Opus 4.5, and more",
"blog_url": "https://autobench.org/blog/autobench-Run-Agronomy-1",
"model_count": 40,
"is_latest": true
}