[{"data":1,"prerenderedAt":6782},["ShallowReactive",2],{"benchmark-detail-ifeval":3},{"models":4,"benchmarkModels":2649,"benchmarkCatalog":5117,"benchmarkSources":5568,"monthlyFrontier":5569,"countryFrontier":6013,"totalModels":6779,"totalBenchmarkModels":6780,"dateRange":6781},[5,19,31,42,51,62,70,79,90,100,108,122,134,149,162,175,187,202,213,222,232,244,255,267,281,292,306,318,331,338,347,353,364,371,381,389,397,405,418,430,440,451,463,471,476,489,498,506,517,530,537,546,559,571,581,591,606,616,627,639,646,657,663,674,681,692,701,714,726,738,750,759,772,786,795,801,813,821,829,836,842,850,862,872,881,895,907,920,926,937,945,951,964,975,986,996,1005,1015,1025,1033,1043,1051,1060,1072,1080,1087,1094,1101,1114,1125,1137,1147,1159,1170,1176,1193,1212,1227,1244,1261,1273,1280,1288,1294,1300,1307,1316,1325,1333,1345,1358,1368,1380,1386,1392,1400,1409,1421,1430,1438,1444,1456,1462,1471,1478,1485,1493,1503,1512,1518,1529,1537,1544,1557,1564,1576,1583,1591,1601,1612,1619,1629,1637,1646,1653,1663,1670,1678,1687,1693,1702,1714,1722,1729,1736,1746,1756,1766,1773,1779,1787,1795,1801,1808,1814,1821,1829,1836,1846,1855,1862,1869,1878,1885,1891,1900,1907,1913,1924,1933,1945,1953,1959,1965,1971,1977,1988,1994,2000,2007,2015,2023,2031,2039,2046,2055,2064,2075,2082,2088,2099,2107,2116,2122,2128,2134,2141,2148,2157,2167,2173,2179,2185,2191,2200,2208,2217,2224,2231,2237,2243,2250,2256,2264,2270,2277,2285,2296,2302,2309,2316,2324,2331,2340,2352,2358,2364,2373,2386,2394,2401,2407,2415,2423,2430,2438,2446,2452,2463,2470,2477,2484,2490,2498,2505,2511,2518,2524,2530,2536,2543,2549,2555,2561,2567,2573,2580,2586,2593,2599,2605,2612,2619,2625,2631,2637,2643],{"provider_id":6,"slug":7,"model_name":8,"provider_name":9,"provider":10,"is_open":11,"author_country":12,"release_date":13,"release_month":14,"context_length":15,"input_price_per_1m_tokens":16,"output_price_per_1m_tokens":17,"input_price":16,"output_price":17,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":18,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-4","openai-gpt-4","GPT-4","OpenAI","OpenAI GPT-4",false,null,1685232000,"2023-05",8191,30,60,67.7,{"provider_id":20,"slug":21,"model_name":22,"provider_name":9,"provider":23,"is_open":11,"author_country":12,"release_date":13,"release_month":14,"context_length":24,"input_price_per_1m_tokens":25,"output_price_per_1m_tokens":26,"input_price":25,"output_price":26,"benchmark_mmlu_pro":27,"benchmark_gpqa":28,"benchmark_aider":29,"benchmark_livecodebench":12,"benchmark_math_hard":30,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-3.5-turbo","openai-gpt-3.5-turbo","GPT-3.5 Turbo","OpenAI GPT-3.5 Turbo",16385,0.5,1.5,46.2,29.7,57.9,44.1,{"provider_id":32,"slug":33,"model_name":34,"provider_name":35,"provider":36,"is_open":37,"author_country":12,"release_date":38,"release_month":39,"context_length":40,"input_price_per_1m_tokens":41,"output_price_per_1m_tokens":41,"input_price":41,"output_price":41,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"gryphe:mythomax-l2-13b","gryphe-mythomax-l2-13b","MythoMax 13B","Gryphe","Gryphe MythoMax 13B",true,1688256000,"2023-07",4096,0.06,{"provider_id":43,"slug":44,"model_name":45,"provider_name":46,"provider":47,"is_open":37,"author_country":12,"release_date":48,"release_month":39,"context_length":49,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":50,"input_price":50,"output_price":50,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"undi95:remm-slerp-l2-13b","undi95-remm-slerp-l2-13b","ReMM SLERP 13B","Undi95","Undi95 ReMM SLERP 13B",1689984000,6144,0.3,{"provider_id":52,"slug":53,"model_name":54,"provider_name":55,"provider":56,"is_open":11,"author_country":12,"release_date":57,"release_month":58,"context_length":59,"input_price_per_1m_tokens":60,"output_price_per_1m_tokens":61,"input_price":60,"output_price":61,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mancer:weaver","mancer-weaver","Weaver (alpha)","Mancer","Mancer Weaver (alpha)",1690934400,"2023-08",8000,0.75,1,{"provider_id":63,"slug":64,"model_name":65,"provider_name":9,"provider":66,"is_open":11,"author_country":12,"release_date":67,"release_month":58,"context_length":24,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":69,"input_price":68,"output_price":69,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-3.5-turbo-16k","openai-gpt-3.5-turbo-16k","GPT-3.5 Turbo 16k","OpenAI GPT-3.5 Turbo 16k",1693180800,3,4,{"provider_id":71,"slug":72,"model_name":73,"provider_name":9,"provider":74,"is_open":11,"author_country":12,"release_date":75,"release_month":76,"context_length":77,"input_price_per_1m_tokens":26,"output_price_per_1m_tokens":78,"input_price":26,"output_price":78,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-3.5-turbo-instruct","openai-gpt-3.5-turbo-instruct","GPT-3.5 Turbo Instruct","OpenAI GPT-3.5 Turbo Instruct",1695859200,"2023-09",4095,2,{"provider_id":80,"slug":81,"model_name":82,"provider_name":83,"provider":84,"is_open":11,"author_country":12,"release_date":75,"release_month":76,"context_length":85,"input_price_per_1m_tokens":86,"output_price_per_1m_tokens":87,"input_price":86,"output_price":87,"benchmark_mmlu_pro":88,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":89,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-7b-instruct-v0.1","mistral-ai-mistral-7b-instruct-v0.1","Mistral 7B Instruct v0.1","Mistral AI","Mistral AI Mistral 7B Instruct v0.1",2824,0.11,0.19,15.72,2.27,{"provider_id":91,"slug":92,"model_name":93,"provider_name":94,"provider":95,"is_open":37,"author_country":12,"release_date":96,"release_month":97,"context_length":49,"input_price_per_1m_tokens":98,"output_price_per_1m_tokens":99,"input_price":98,"output_price":99,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"alpindale:goliath-120b","alpindale-goliath-120b","Goliath 120B","Alpindale","Alpindale Goliath 120B",1699574400,"2023-11",3.75,7.5,{"provider_id":101,"slug":102,"model_name":103,"provider_name":104,"provider":105,"is_open":37,"author_country":12,"release_date":106,"release_month":97,"context_length":40,"input_price_per_1m_tokens":107,"output_price_per_1m_tokens":61,"input_price":107,"output_price":61,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"neversleep:noromaid-20b","neversleep-noromaid-20b","Noromaid 20B","Neversleep","Neversleep Noromaid 20B",1700956800,0.625,{"provider_id":109,"slug":110,"model_name":111,"provider_name":83,"provider":112,"is_open":37,"author_country":12,"release_date":113,"release_month":114,"context_length":115,"input_price_per_1m_tokens":116,"output_price_per_1m_tokens":117,"input_price":116,"output_price":117,"benchmark_mmlu_pro":118,"benchmark_gpqa":119,"benchmark_aider":12,"benchmark_livecodebench":120,"benchmark_math_hard":121,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mixtral-8x7b-instruct","mistral-ai-mixtral-8x7b-instruct","Mixtral 8x7B Instruct","Mistral AI Mixtral 8x7B Instruct",1702166400,"2023-12",32768,0.14,0.42,38.7,29.2,6.6,29.9,{"provider_id":123,"slug":124,"model_name":125,"provider_name":83,"provider":126,"is_open":37,"author_country":12,"release_date":127,"release_month":128,"context_length":129,"input_price_per_1m_tokens":25,"output_price_per_1m_tokens":26,"input_price":25,"output_price":26,"benchmark_mmlu_pro":130,"benchmark_gpqa":131,"benchmark_aider":12,"benchmark_livecodebench":132,"benchmark_math_hard":133,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-large","mistral-ai-mistral-large","Mistral Large","Mistral AI Mistral Large",1708905600,"2024-02",128000,51.5,35.1,17.8,52.7,{"provider_id":135,"slug":136,"model_name":137,"provider_name":138,"provider":139,"is_open":11,"author_country":12,"release_date":140,"release_month":141,"context_length":142,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":144,"input_price":143,"output_price":144,"benchmark_mmlu_pro":12,"benchmark_gpqa":145,"benchmark_aider":146,"benchmark_livecodebench":147,"benchmark_math_hard":148,"benchmark_aime":61,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"anthropic:claude-3-haiku","anthropic-claude-3-haiku","Claude 3 Haiku","Anthropic","Anthropic Claude 3 Haiku",1710288000,"2024-03",200000,0.25,1.25,37.4,47.4,15.4,39.4,{"provider_id":150,"slug":151,"model_name":152,"provider_name":9,"provider":153,"is_open":11,"author_country":12,"release_date":154,"release_month":155,"context_length":129,"input_price_per_1m_tokens":156,"output_price_per_1m_tokens":16,"input_price":156,"output_price":16,"benchmark_mmlu_pro":157,"benchmark_gpqa":12,"benchmark_aider":158,"benchmark_livecodebench":159,"benchmark_math_hard":160,"benchmark_aime":161,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-4-turbo","openai-gpt-4-turbo","GPT-4 Turbo","OpenAI GPT-4 Turbo",1712620800,"2024-04",10,69.4,63.9,29.1,73.7,15,{"provider_id":163,"slug":164,"model_name":165,"provider_name":166,"provider":167,"is_open":37,"author_country":12,"release_date":168,"release_month":155,"context_length":169,"input_price_per_1m_tokens":170,"output_price_per_1m_tokens":170,"input_price":170,"output_price":170,"benchmark_mmlu_pro":171,"benchmark_gpqa":172,"benchmark_aider":173,"benchmark_livecodebench":12,"benchmark_math_hard":174,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"microsoft:wizardlm-2-8x22b","microsoft-wizardlm-2-8x22b","WizardLM-2 8x22B","Microsoft","Microsoft WizardLM-2 8x22B",1713225600,65535,0.62,39.96,17.56,44.4,25,{"provider_id":176,"slug":177,"model_name":178,"provider_name":83,"provider":179,"is_open":37,"author_country":12,"release_date":180,"release_month":155,"context_length":181,"input_price_per_1m_tokens":182,"output_price_per_1m_tokens":182,"input_price":182,"output_price":182,"benchmark_mmlu_pro":183,"benchmark_gpqa":184,"benchmark_aider":12,"benchmark_livecodebench":185,"benchmark_math_hard":186,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mixtral-8x22b-instruct","mistral-ai-mixtral-8x22b-instruct","Mixtral 8x22B Instruct","Mistral AI Mixtral 8x22B Instruct",1713312000,65536,1.2,53.7,33.2,14.8,54.5,{"provider_id":188,"slug":189,"model_name":190,"provider_name":191,"provider":192,"is_open":37,"author_country":12,"release_date":193,"release_month":155,"context_length":194,"input_price_per_1m_tokens":195,"output_price_per_1m_tokens":196,"input_price":195,"output_price":196,"benchmark_mmlu_pro":197,"benchmark_gpqa":198,"benchmark_aider":199,"benchmark_livecodebench":200,"benchmark_math_hard":201,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meta-llama:llama-3-70b-instruct","meta-llama-llama-3-70b-instruct","Llama 3 70B Instruct","Meta-llama","Meta-llama Llama 3 70B Instruct",1713398400,8192,0.51,0.74,57.4,37.9,49.2,19.8,48.3,{"provider_id":203,"slug":204,"model_name":205,"provider_name":191,"provider":206,"is_open":37,"author_country":12,"release_date":193,"release_month":155,"context_length":194,"input_price_per_1m_tokens":207,"output_price_per_1m_tokens":208,"input_price":207,"output_price":208,"benchmark_mmlu_pro":209,"benchmark_gpqa":210,"benchmark_aider":12,"benchmark_livecodebench":211,"benchmark_math_hard":212,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meta-llama:llama-3-8b-instruct","meta-llama-llama-3-8b-instruct","Llama 3 8B Instruct","Meta-llama Llama 3 8B Instruct",0.03,0.04,40.5,29.6,9.6,49.9,{"provider_id":214,"slug":215,"model_name":216,"provider_name":9,"provider":217,"is_open":11,"author_country":12,"release_date":218,"release_month":219,"context_length":129,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":156,"input_price":220,"output_price":156,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":221,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-4o","openai-gpt-4o","GPT-4o","OpenAI GPT-4o",1715558400,"2024-05",2.5,74.4,{"provider_id":223,"slug":224,"model_name":225,"provider_name":226,"provider":227,"is_open":37,"author_country":12,"release_date":228,"release_month":219,"context_length":194,"input_price_per_1m_tokens":116,"output_price_per_1m_tokens":116,"input_price":116,"output_price":116,"benchmark_mmlu_pro":229,"benchmark_gpqa":230,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":231,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"nousresearch:hermes-2-pro-llama-3-8b","nousresearch-hermes-2-pro-llama-3-8b","Hermes 2 Pro - Llama-3 8B","Nousresearch","Nousresearch Hermes 2 Pro - Llama-3 8B",1716768000,22.8,5.7,8.38,{"provider_id":233,"slug":234,"model_name":235,"provider_name":236,"provider":237,"is_open":37,"author_country":12,"release_date":238,"release_month":239,"context_length":194,"input_price_per_1m_tokens":240,"output_price_per_1m_tokens":240,"input_price":240,"output_price":240,"benchmark_mmlu_pro":241,"benchmark_gpqa":242,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":243,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"sao10k:l3-euryale-70b","sao10k-l3-euryale-70b","Llama 3 Euryale 70B v2.1","Sao10k","Sao10k Llama 3 Euryale 70B v2.1",1718668800,"2024-06",1.48,45.51,10.85,22.43,{"provider_id":245,"slug":246,"model_name":247,"provider_name":248,"provider":249,"is_open":37,"author_country":12,"release_date":250,"release_month":239,"context_length":194,"input_price_per_1m_tokens":207,"output_price_per_1m_tokens":251,"input_price":207,"output_price":251,"benchmark_mmlu_pro":252,"benchmark_gpqa":253,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":254,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemma-2-9b-it","google-gemma-2-9b-it","Gemma 2 9B","Google","Google Gemma 2 9B",1719532800,0.08,31.95,14.77,19.49,{"provider_id":256,"slug":257,"model_name":258,"provider_name":248,"provider":259,"is_open":37,"author_country":12,"release_date":260,"release_month":261,"context_length":194,"input_price_per_1m_tokens":262,"output_price_per_1m_tokens":262,"input_price":262,"output_price":262,"benchmark_mmlu_pro":263,"benchmark_gpqa":264,"benchmark_aider":265,"benchmark_livecodebench":12,"benchmark_math_hard":266,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemma-2-27b-it","google-gemma-2-27b-it","Gemma 2 27B","Google Gemma 2 27B",1720828800,"2024-07",0.65,38.35,16.67,36.1,23.87,{"provider_id":268,"slug":269,"model_name":270,"provider_name":9,"provider":271,"is_open":11,"author_country":12,"release_date":272,"release_month":261,"context_length":129,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":274,"input_price":273,"output_price":274,"benchmark_mmlu_pro":275,"benchmark_gpqa":276,"benchmark_aider":277,"benchmark_livecodebench":278,"benchmark_math_hard":279,"benchmark_aime":280,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-4o-mini","openai-gpt-4o-mini","GPT-4o-mini","OpenAI GPT-4o-mini",1721260800,0.15,0.6,64.8,42.6,55.6,23.4,78.9,11.7,{"provider_id":282,"slug":283,"model_name":284,"provider_name":83,"provider":285,"is_open":37,"author_country":12,"release_date":286,"release_month":261,"context_length":287,"input_price_per_1m_tokens":288,"output_price_per_1m_tokens":208,"input_price":288,"output_price":208,"benchmark_mmlu_pro":289,"benchmark_gpqa":290,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":291,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-nemo","mistral-ai-mistral-nemo","Mistral Nemo","Mistral AI Mistral Nemo",1721347200,131072,0.02,26.41,8.72,7.4,{"provider_id":293,"slug":294,"model_name":295,"provider_name":191,"provider":296,"is_open":37,"author_country":12,"release_date":297,"release_month":261,"context_length":298,"input_price_per_1m_tokens":288,"output_price_per_1m_tokens":299,"input_price":288,"output_price":299,"benchmark_mmlu_pro":300,"benchmark_gpqa":301,"benchmark_aider":302,"benchmark_livecodebench":303,"benchmark_math_hard":304,"benchmark_aime":305,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meta-llama:llama-3.1-8b-instruct","meta-llama-llama-3.1-8b-instruct","Llama 3.1 8B Instruct","Meta-llama Llama 3.1 8B Instruct",1721692800,16384,0.05,47.6,25.9,37.6,11.6,51.9,7.7,{"provider_id":307,"slug":308,"model_name":309,"provider_name":191,"provider":310,"is_open":37,"author_country":12,"release_date":297,"release_month":261,"context_length":311,"input_price_per_1m_tokens":312,"output_price_per_1m_tokens":312,"input_price":312,"output_price":312,"benchmark_mmlu_pro":313,"benchmark_gpqa":130,"benchmark_aider":314,"benchmark_livecodebench":315,"benchmark_math_hard":316,"benchmark_aime":317,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meta-llama:llama-3.1-405b-instruct","meta-llama-llama-3.1-405b-instruct","Llama 3.1 405B Instruct","Meta-llama Llama 3.1 405B Instruct",131000,0.9,73.2,66.2,30.5,70.3,21.3,{"provider_id":319,"slug":320,"model_name":321,"provider_name":191,"provider":322,"is_open":37,"author_country":12,"release_date":297,"release_month":261,"context_length":287,"input_price_per_1m_tokens":323,"output_price_per_1m_tokens":324,"input_price":323,"output_price":324,"benchmark_mmlu_pro":325,"benchmark_gpqa":326,"benchmark_aider":327,"benchmark_livecodebench":328,"benchmark_math_hard":329,"benchmark_aime":330,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meta-llama:llama-3.1-70b-instruct","meta-llama-llama-3.1-70b-instruct","Llama 3.1 70B Instruct","Meta-llama Llama 3.1 70B Instruct",0.34,0.39,67.6,40.9,58.6,23.2,64.9,17.3,{"provider_id":332,"slug":333,"model_name":334,"provider_name":191,"provider":335,"is_open":37,"author_country":12,"release_date":336,"release_month":337,"context_length":115,"input_price_per_1m_tokens":69,"output_price_per_1m_tokens":69,"input_price":69,"output_price":69,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meta-llama:llama-3.1-405b","meta-llama-llama-3.1-405b","Llama 3.1 405B (base)","Meta-llama Llama 3.1 405B (base)",1722556800,"2024-08",{"provider_id":339,"slug":340,"model_name":341,"provider_name":236,"provider":342,"is_open":37,"author_country":12,"release_date":343,"release_month":337,"context_length":194,"input_price_per_1m_tokens":208,"output_price_per_1m_tokens":299,"input_price":208,"output_price":299,"benchmark_mmlu_pro":344,"benchmark_gpqa":345,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":346,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"sao10k:l3-lunaris-8b","sao10k-l3-lunaris-8b","Llama 3 8B Lunaris","Sao10k Llama 3 8B Lunaris",1723507200,30.97,6.82,9.06,{"provider_id":348,"slug":349,"model_name":350,"provider_name":226,"provider":351,"is_open":37,"author_country":12,"release_date":352,"release_month":337,"context_length":287,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":61,"input_price":61,"output_price":61,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":158,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"nousresearch:hermes-3-llama-3.1-405b","nousresearch-hermes-3-llama-3.1-405b","Hermes 3 405B Instruct","Nousresearch Hermes 3 405B Instruct",1723766400,{"provider_id":354,"slug":355,"model_name":356,"provider_name":226,"provider":357,"is_open":37,"author_country":12,"release_date":358,"release_month":337,"context_length":181,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":50,"input_price":50,"output_price":50,"benchmark_mmlu_pro":359,"benchmark_gpqa":360,"benchmark_aider":12,"benchmark_livecodebench":361,"benchmark_math_hard":362,"benchmark_aime":363,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"nousresearch:hermes-3-llama-3.1-70b","nousresearch-hermes-3-llama-3.1-70b","Hermes 3 70B Instruct","Nousresearch Hermes 3 70B Instruct",1723939200,57.1,40.1,18.8,53.8,2.3,{"provider_id":365,"slug":366,"model_name":367,"provider_name":236,"provider":368,"is_open":37,"author_country":12,"release_date":369,"release_month":337,"context_length":115,"input_price_per_1m_tokens":370,"output_price_per_1m_tokens":370,"input_price":370,"output_price":370,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"sao10k:l3.1-euryale-70b","sao10k-l3.1-euryale-70b","Llama 3.1 Euryale 70B v2.2","Sao10k Llama 3.1 Euryale 70B v2.2",1724803200,0.85,{"provider_id":372,"slug":373,"model_name":374,"provider_name":375,"provider":376,"is_open":37,"author_country":12,"release_date":369,"release_month":337,"context_length":115,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"benchmark_mmlu_pro":378,"benchmark_gpqa":379,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":380,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen-2.5-vl-7b-instruct","qwen-qwen-2.5-vl-7b-instruct","Qwen2.5-VL 7B Instruct","Qwen","Qwen Qwen2.5-VL 7B Instruct",0.2,34.39,9.28,19.86,{"provider_id":382,"slug":383,"model_name":384,"provider_name":385,"provider":386,"is_open":37,"author_country":12,"release_date":387,"release_month":337,"context_length":129,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":274,"input_price":273,"output_price":274,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":388,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"cohere:command-r-08-2024","cohere-command-r-08-2024","Command R (08-2024)","Cohere","Cohere Command R (08-2024)",1724976000,38.3,{"provider_id":390,"slug":391,"model_name":392,"provider_name":385,"provider":393,"is_open":37,"author_country":12,"release_date":387,"release_month":337,"context_length":129,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":156,"input_price":220,"output_price":156,"benchmark_mmlu_pro":394,"benchmark_gpqa":395,"benchmark_aider":388,"benchmark_livecodebench":12,"benchmark_math_hard":396,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"cohere:command-r-plus-08-2024","cohere-command-r-plus-08-2024","Command R+ (08-2024)","Cohere Command R+ (08-2024)",38.01,13.42,12.39,{"provider_id":398,"slug":399,"model_name":400,"provider_name":104,"provider":401,"is_open":37,"author_country":12,"release_date":402,"release_month":403,"context_length":115,"input_price_per_1m_tokens":404,"output_price_per_1m_tokens":25,"input_price":404,"output_price":25,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"neversleep:llama-3.1-lumimaid-8b","neversleep-llama-3.1-lumimaid-8b","Lumimaid v0.2 8B","Neversleep Lumimaid v0.2 8B",1726358400,"2024-09",0.09,{"provider_id":406,"slug":407,"model_name":408,"provider_name":375,"provider":409,"is_open":37,"author_country":12,"release_date":410,"release_month":403,"context_length":115,"input_price_per_1m_tokens":411,"output_price_per_1m_tokens":324,"input_price":411,"output_price":324,"benchmark_mmlu_pro":412,"benchmark_gpqa":413,"benchmark_aider":414,"benchmark_livecodebench":415,"benchmark_math_hard":416,"benchmark_aime":417,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen-2.5-72b-instruct","qwen-qwen-2.5-72b-instruct","Qwen2.5 72B Instruct","Qwen Qwen2.5 72B Instruct",1726704000,0.12,72,49.1,65.4,27.6,85.8,16,{"provider_id":419,"slug":420,"model_name":421,"provider_name":191,"provider":422,"is_open":37,"author_country":12,"release_date":423,"release_month":403,"context_length":424,"input_price_per_1m_tokens":207,"output_price_per_1m_tokens":299,"input_price":207,"output_price":299,"benchmark_mmlu_pro":425,"benchmark_gpqa":426,"benchmark_aider":12,"benchmark_livecodebench":427,"benchmark_math_hard":428,"benchmark_aime":429,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meta-llama:llama-3.2-3b-instruct","meta-llama-llama-3.2-3b-instruct","Llama 3.2 3B Instruct","Meta-llama Llama 3.2 3B Instruct",1727222400,80000,34.7,25.5,8.3,48.9,6.7,{"provider_id":431,"slug":432,"model_name":433,"provider_name":191,"provider":434,"is_open":37,"author_country":12,"release_date":423,"release_month":403,"context_length":435,"input_price_per_1m_tokens":288,"output_price_per_1m_tokens":288,"input_price":288,"output_price":288,"benchmark_mmlu_pro":436,"benchmark_gpqa":437,"benchmark_aider":12,"benchmark_livecodebench":438,"benchmark_math_hard":439,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meta-llama:llama-3.2-1b-instruct","meta-llama-llama-3.2-1b-instruct","Llama 3.2 1B Instruct","Meta-llama Llama 3.2 1B Instruct",60000,20,19.6,1.9,14,{"provider_id":441,"slug":442,"model_name":443,"provider_name":191,"provider":444,"is_open":37,"author_country":12,"release_date":423,"release_month":403,"context_length":287,"input_price_per_1m_tokens":445,"output_price_per_1m_tokens":445,"input_price":445,"output_price":445,"benchmark_mmlu_pro":446,"benchmark_gpqa":447,"benchmark_aider":12,"benchmark_livecodebench":448,"benchmark_math_hard":449,"benchmark_aime":450,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meta-llama:llama-3.2-11b-vision-instruct","meta-llama-llama-3.2-11b-vision-instruct","Llama 3.2 11B Vision Instruct","Meta-llama Llama 3.2 11B Vision Instruct",0.049,46.4,22.1,11,51.6,9.3,{"provider_id":452,"slug":453,"model_name":454,"provider_name":455,"provider":456,"is_open":37,"author_country":12,"release_date":457,"release_month":403,"context_length":115,"input_price_per_1m_tokens":458,"output_price_per_1m_tokens":459,"input_price":458,"output_price":459,"benchmark_mmlu_pro":460,"benchmark_gpqa":461,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":462,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"thedrummer:rocinante-12b","thedrummer-rocinante-12b","Rocinante 12B","Thedrummer","Thedrummer Rocinante 12B",1727654400,0.17,0.43,27.53,5.48,12.69,{"provider_id":464,"slug":465,"model_name":466,"provider_name":467,"provider":468,"is_open":11,"author_country":12,"release_date":469,"release_month":470,"context_length":59,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":156,"input_price":220,"output_price":156,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"inflection:inflection-3-pi","inflection-inflection-3-pi","Inflection 3 Pi","Inflection","Inflection Inflection 3 Pi",1728604800,"2024-10",{"provider_id":472,"slug":473,"model_name":474,"provider_name":467,"provider":475,"is_open":11,"author_country":12,"release_date":469,"release_month":470,"context_length":59,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":156,"input_price":220,"output_price":156,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"inflection:inflection-3-productivity","inflection-inflection-3-productivity","Inflection 3 Productivity","Inflection Inflection 3 Productivity",{"provider_id":477,"slug":478,"model_name":479,"provider_name":480,"provider":481,"is_open":11,"author_country":12,"release_date":482,"release_month":470,"context_length":287,"input_price_per_1m_tokens":312,"output_price_per_1m_tokens":312,"input_price":312,"output_price":312,"benchmark_mmlu_pro":483,"benchmark_gpqa":484,"benchmark_aider":485,"benchmark_livecodebench":486,"benchmark_math_hard":487,"benchmark_aime":488,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"nvidia:llama-3.1-nemotron-70b-instruct","nvidia-llama-3.1-nemotron-70b-instruct","Llama 3.1 Nemotron 70B Instruct","Nvidia","Nvidia Llama 3.1 Nemotron 70B Instruct",1728950400,69,46.5,54.9,16.9,73.3,24.7,{"provider_id":490,"slug":491,"model_name":492,"provider_name":375,"provider":493,"is_open":37,"author_country":12,"release_date":494,"release_month":470,"context_length":115,"input_price_per_1m_tokens":208,"output_price_per_1m_tokens":495,"input_price":208,"output_price":495,"benchmark_mmlu_pro":496,"benchmark_gpqa":461,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":497,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen-2.5-7b-instruct","qwen-qwen-2.5-7b-instruct","Qwen2.5 7B Instruct","Qwen Qwen2.5 7B Instruct",1729036800,0.1,36.52,50,{"provider_id":499,"slug":500,"model_name":501,"provider_name":502,"provider":503,"is_open":37,"author_country":12,"release_date":504,"release_month":470,"context_length":298,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":505,"input_price":68,"output_price":505,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"anthracite-org:magnum-v4-72b","anthracite-org-magnum-v4-72b","Magnum v4 72B","Anthracite-org","Anthracite-org Magnum v4 72B",1729555200,5,{"provider_id":507,"slug":508,"model_name":509,"provider_name":138,"provider":510,"is_open":11,"author_country":12,"release_date":504,"release_month":470,"context_length":142,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"benchmark_mmlu_pro":511,"benchmark_gpqa":512,"benchmark_aider":513,"benchmark_livecodebench":514,"benchmark_math_hard":515,"benchmark_aime":516,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"anthropic:claude-3.5-sonnet","anthropic-claude-3.5-sonnet","Claude 3.5 Sonnet","Anthropic Claude 3.5 Sonnet",77.2,59.9,84.2,38.1,77.1,15.7,{"provider_id":518,"slug":519,"model_name":520,"provider_name":138,"provider":521,"is_open":11,"author_country":12,"release_date":522,"release_month":523,"context_length":142,"input_price_per_1m_tokens":524,"output_price_per_1m_tokens":69,"input_price":524,"output_price":69,"benchmark_mmlu_pro":525,"benchmark_gpqa":526,"benchmark_aider":12,"benchmark_livecodebench":527,"benchmark_math_hard":528,"benchmark_aime":529,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"anthropic:claude-3.5-haiku","anthropic-claude-3.5-haiku","Claude 3.5 Haiku","Anthropic Claude 3.5 Haiku",1730678400,"2024-11",0.8,63.4,40.8,31.4,72.1,3.3,{"provider_id":531,"slug":532,"model_name":533,"provider_name":455,"provider":534,"is_open":37,"author_country":12,"release_date":535,"release_month":523,"context_length":115,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":536,"input_price":536,"output_price":536,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"thedrummer:unslopnemo-12b","thedrummer-unslopnemo-12b","UnslopNemo 12B","Thedrummer UnslopNemo 12B",1731103448,0.4,{"provider_id":538,"slug":539,"model_name":540,"provider_name":541,"provider":542,"is_open":37,"author_country":12,"release_date":543,"release_month":523,"context_length":544,"input_price_per_1m_tokens":545,"output_price_per_1m_tokens":545,"input_price":545,"output_price":545,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"raifle:sorcererlm-8x22b","raifle-sorcererlm-8x22b","SorcererLM 8x22B","Raifle","Raifle SorcererLM 8x22B",1731105083,16000,4.5,{"provider_id":547,"slug":548,"model_name":549,"provider_name":375,"provider":550,"is_open":37,"author_country":12,"release_date":551,"release_month":523,"context_length":115,"input_price_per_1m_tokens":552,"output_price_per_1m_tokens":524,"input_price":552,"output_price":524,"benchmark_mmlu_pro":553,"benchmark_gpqa":554,"benchmark_aider":555,"benchmark_livecodebench":556,"benchmark_math_hard":557,"benchmark_aime":558,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen-2.5-coder-32b-instruct","qwen-qwen-2.5-coder-32b-instruct","Qwen2.5 Coder 32B Instruct","Qwen Qwen2.5 Coder 32B Instruct",1731368400,0.66,63.5,41.7,72.9,29.5,76.7,12,{"provider_id":560,"slug":561,"model_name":562,"provider_name":83,"provider":563,"is_open":37,"author_country":12,"release_date":564,"release_month":523,"context_length":287,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":565,"input_price":78,"output_price":565,"benchmark_mmlu_pro":566,"benchmark_gpqa":567,"benchmark_aider":12,"benchmark_livecodebench":568,"benchmark_math_hard":569,"benchmark_aime":570,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:pixtral-large-2411","mistral-ai-pixtral-large-2411","Pixtral Large 2411","Mistral AI Pixtral Large 2411",1731977388,6,70.1,50.5,26.1,71.4,7,{"provider_id":572,"slug":573,"model_name":574,"provider_name":83,"provider":575,"is_open":37,"author_country":12,"release_date":576,"release_month":523,"context_length":287,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":565,"input_price":78,"output_price":565,"benchmark_mmlu_pro":577,"benchmark_gpqa":578,"benchmark_aider":579,"benchmark_livecodebench":580,"benchmark_math_hard":569,"benchmark_aime":450,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-large-2407","mistral-ai-mistral-large-2407","Mistral Large 2407","Mistral AI Mistral Large 2407",1731978415,68.3,47.2,60.2,26.7,{"provider_id":582,"slug":583,"model_name":584,"provider_name":83,"provider":585,"is_open":11,"author_country":12,"release_date":586,"release_month":523,"context_length":287,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":565,"input_price":78,"output_price":565,"benchmark_mmlu_pro":587,"benchmark_gpqa":588,"benchmark_aider":414,"benchmark_livecodebench":589,"benchmark_math_hard":590,"benchmark_aime":448,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-large-2411","mistral-ai-mistral-large-2411","Mistral Large 2411","Mistral AI Mistral Large 2411",1731978685,69.7,48.6,29.3,73.6,{"provider_id":592,"slug":593,"model_name":594,"provider_name":595,"provider":596,"is_open":11,"author_country":12,"release_date":597,"release_month":598,"context_length":599,"input_price_per_1m_tokens":524,"output_price_per_1m_tokens":600,"input_price":524,"output_price":600,"benchmark_mmlu_pro":601,"benchmark_gpqa":212,"benchmark_aider":602,"benchmark_livecodebench":603,"benchmark_math_hard":604,"benchmark_aime":605,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"amazon:nova-pro-v1","amazon-nova-pro-v1","Nova Pro 1.0","Amazon","Amazon Nova Pro 1.0",1733436303,"2024-12",300000,3.2,69.1,54.1,23.3,78.6,10.7,{"provider_id":607,"slug":608,"model_name":609,"provider_name":595,"provider":610,"is_open":11,"author_country":12,"release_date":611,"release_month":598,"context_length":129,"input_price_per_1m_tokens":612,"output_price_per_1m_tokens":116,"input_price":612,"output_price":116,"benchmark_mmlu_pro":613,"benchmark_gpqa":614,"benchmark_aider":12,"benchmark_livecodebench":439,"benchmark_math_hard":316,"benchmark_aime":615,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"amazon:nova-micro-v1","amazon-nova-micro-v1","Nova Micro 1.0","Amazon Nova Micro 1.0",1733437237,0.035,53.1,35.8,8,{"provider_id":617,"slug":618,"model_name":619,"provider_name":595,"provider":620,"is_open":11,"author_country":12,"release_date":621,"release_month":598,"context_length":599,"input_price_per_1m_tokens":41,"output_price_per_1m_tokens":622,"input_price":41,"output_price":622,"benchmark_mmlu_pro":623,"benchmark_gpqa":624,"benchmark_aider":12,"benchmark_livecodebench":625,"benchmark_math_hard":626,"benchmark_aime":605,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"amazon:nova-lite-v1","amazon-nova-lite-v1","Nova Lite 1.0","Amazon Nova Lite 1.0",1733437363,0.24,59,43.3,16.7,76.5,{"provider_id":628,"slug":629,"model_name":630,"provider_name":191,"provider":631,"is_open":37,"author_country":12,"release_date":632,"release_month":598,"context_length":287,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":633,"input_price":495,"output_price":633,"benchmark_mmlu_pro":634,"benchmark_gpqa":635,"benchmark_aider":636,"benchmark_livecodebench":637,"benchmark_math_hard":638,"benchmark_aime":16,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meta-llama:llama-3.3-70b-instruct","meta-llama-llama-3.3-70b-instruct","Llama 3.3 70B Instruct","Meta-llama Llama 3.3 70B Instruct",1733506137,0.32,71.3,49.8,59.4,28.8,77.3,{"provider_id":640,"slug":641,"model_name":642,"provider_name":385,"provider":643,"is_open":37,"author_country":12,"release_date":644,"release_month":598,"context_length":129,"input_price_per_1m_tokens":645,"output_price_per_1m_tokens":273,"input_price":645,"output_price":273,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"cohere:command-r7b-12-2024","cohere-command-r7b-12-2024","Command R7B (12-2024)","Cohere Command R7B (12-2024)",1734158152,0.0375,{"provider_id":647,"slug":648,"model_name":649,"provider_name":9,"provider":650,"is_open":11,"author_country":12,"release_date":651,"release_month":598,"context_length":142,"input_price_per_1m_tokens":161,"output_price_per_1m_tokens":17,"input_price":161,"output_price":17,"benchmark_mmlu_pro":652,"benchmark_gpqa":653,"benchmark_aider":513,"benchmark_livecodebench":654,"benchmark_math_hard":655,"benchmark_aime":656,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:o1","openai-o1","o1","OpenAI o1",1734459999,84.1,74.7,67.9,97,72.3,{"provider_id":658,"slug":659,"model_name":660,"provider_name":236,"provider":661,"is_open":37,"author_country":12,"release_date":662,"release_month":598,"context_length":287,"input_price_per_1m_tokens":262,"output_price_per_1m_tokens":60,"input_price":262,"output_price":60,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"sao10k:l3.3-euryale-70b","sao10k-l3.3-euryale-70b","Llama 3.3 Euryale 70B","Sao10k Llama 3.3 Euryale 70B",1734535928,{"provider_id":664,"slug":665,"model_name":666,"provider_name":667,"provider":668,"is_open":37,"author_country":12,"release_date":669,"release_month":598,"context_length":670,"input_price_per_1m_tokens":671,"output_price_per_1m_tokens":672,"input_price":671,"output_price":672,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":673,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"deepseek:deepseek-chat","deepseek-deepseek-chat","DeepSeek V3","Deepseek","Deepseek DeepSeek V3",1735241320,163840,0.014,0.028,48.4,{"provider_id":675,"slug":676,"model_name":677,"provider_name":236,"provider":678,"is_open":37,"author_country":12,"release_date":679,"release_month":680,"context_length":544,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":68,"input_price":68,"output_price":68,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"sao10k:l3.1-70b-hanami-x1","sao10k-l3.1-70b-hanami-x1","Llama 3.1 70B Hanami x1","Sao10k Llama 3.1 70B Hanami x1",1736302854,"2025-01",{"provider_id":682,"slug":683,"model_name":684,"provider_name":166,"provider":685,"is_open":37,"author_country":12,"release_date":686,"release_month":680,"context_length":298,"input_price_per_1m_tokens":687,"output_price_per_1m_tokens":116,"input_price":687,"output_price":116,"benchmark_mmlu_pro":569,"benchmark_gpqa":688,"benchmark_aider":12,"benchmark_livecodebench":689,"benchmark_math_hard":690,"benchmark_aime":691,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"microsoft:phi-4","microsoft-phi-4","Phi 4","Microsoft Phi 4",1736489872,0.065,57.5,23.1,81,14.3,{"provider_id":693,"slug":694,"model_name":695,"provider_name":696,"provider":697,"is_open":37,"author_country":12,"release_date":698,"release_month":680,"context_length":699,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":700,"input_price":377,"output_price":700,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"minimax:minimax-01","minimax-minimax-01","MiniMax-01","Minimax","Minimax MiniMax-01",1736915462,1000192,1.1,{"provider_id":702,"slug":703,"model_name":704,"provider_name":667,"provider":705,"is_open":11,"author_country":12,"release_date":706,"release_month":680,"context_length":707,"input_price_per_1m_tokens":708,"output_price_per_1m_tokens":78,"input_price":708,"output_price":78,"benchmark_mmlu_pro":709,"benchmark_gpqa":710,"benchmark_aider":711,"benchmark_livecodebench":712,"benchmark_math_hard":713,"benchmark_aime":577,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"deepseek:deepseek-r1","deepseek-deepseek-r1","R1","Deepseek R1",1737381095,64000,0.55,84.4,70.8,64,61.7,96.6,{"provider_id":715,"slug":716,"model_name":717,"provider_name":667,"provider":718,"is_open":37,"author_country":12,"release_date":719,"release_month":680,"context_length":287,"input_price_per_1m_tokens":720,"output_price_per_1m_tokens":524,"input_price":720,"output_price":524,"benchmark_mmlu_pro":721,"benchmark_gpqa":722,"benchmark_aider":12,"benchmark_livecodebench":723,"benchmark_math_hard":724,"benchmark_aime":725,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"deepseek:deepseek-r1-distill-llama-70b","deepseek-deepseek-r1-distill-llama-70b","R1 Distill Llama 70B","Deepseek R1 Distill Llama 70B",1737663169,0.7,79.5,40.2,26.6,93.5,67,{"provider_id":727,"slug":728,"model_name":729,"provider_name":730,"provider":731,"is_open":11,"author_country":12,"release_date":732,"release_month":680,"context_length":733,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":61,"input_price":61,"output_price":61,"benchmark_mmlu_pro":734,"benchmark_gpqa":735,"benchmark_aider":12,"benchmark_livecodebench":556,"benchmark_math_hard":736,"benchmark_aime":737,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"perplexity:sonar","perplexity-sonar","Sonar","Perplexity","Perplexity Sonar",1738013808,127072,68.9,47.1,81.7,48.7,{"provider_id":739,"slug":740,"model_name":741,"provider_name":667,"provider":742,"is_open":11,"author_country":12,"release_date":743,"release_month":680,"context_length":115,"input_price_per_1m_tokens":744,"output_price_per_1m_tokens":744,"input_price":744,"output_price":744,"benchmark_mmlu_pro":745,"benchmark_gpqa":746,"benchmark_aider":12,"benchmark_livecodebench":747,"benchmark_math_hard":748,"benchmark_aime":749,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"deepseek:deepseek-r1-distill-qwen-32b","deepseek-deepseek-r1-distill-qwen-32b","R1 Distill Qwen 32B","Deepseek R1 Distill Qwen 32B",1738194830,0.29,73.9,61.5,27,94.1,68.7,{"provider_id":751,"slug":752,"model_name":753,"provider_name":83,"provider":754,"is_open":37,"author_country":12,"release_date":755,"release_month":680,"context_length":115,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":251,"input_price":299,"output_price":251,"benchmark_mmlu_pro":756,"benchmark_gpqa":27,"benchmark_aider":12,"benchmark_livecodebench":757,"benchmark_math_hard":758,"benchmark_aime":615,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-small-24b-instruct-2501","mistral-ai-mistral-small-24b-instruct-2501","Mistral Small 24B Instruct 2501","Mistral AI Mistral Small 24B Instruct 2501",1738255409,65.2,25.2,71.5,{"provider_id":760,"slug":761,"model_name":762,"provider_name":9,"provider":763,"is_open":11,"author_country":12,"release_date":764,"release_month":680,"context_length":142,"input_price_per_1m_tokens":700,"output_price_per_1m_tokens":765,"input_price":700,"output_price":765,"benchmark_mmlu_pro":766,"benchmark_gpqa":767,"benchmark_aider":768,"benchmark_livecodebench":769,"benchmark_math_hard":770,"benchmark_aime":771,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:o3-mini","openai-o3-mini","o3 Mini","OpenAI o3 Mini",1738351721,4.4,79.1,74.8,60.4,71.7,97.3,77,{"provider_id":773,"slug":774,"model_name":775,"provider_name":375,"provider":776,"is_open":11,"author_country":12,"release_date":777,"release_month":778,"context_length":115,"input_price_per_1m_tokens":779,"output_price_per_1m_tokens":780,"input_price":779,"output_price":780,"benchmark_mmlu_pro":781,"benchmark_gpqa":782,"benchmark_aider":783,"benchmark_livecodebench":784,"benchmark_math_hard":785,"benchmark_aime":603,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen-max","qwen-qwen-max","Qwen-Max","Qwen Qwen-Max",1738402289,"2025-02",1.04,4.16,76.2,58.7,21.8,35.9,83.5,{"provider_id":787,"slug":788,"model_name":789,"provider_name":375,"provider":790,"is_open":11,"author_country":12,"release_date":791,"release_month":778,"context_length":792,"input_price_per_1m_tokens":793,"output_price_per_1m_tokens":794,"input_price":793,"output_price":794,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen-plus","qwen-qwen-plus","Qwen-Plus","Qwen Qwen-Plus",1738409840,1000000,0.26,0.78,{"provider_id":796,"slug":797,"model_name":798,"provider_name":375,"provider":799,"is_open":37,"author_country":12,"release_date":800,"release_month":778,"context_length":115,"input_price_per_1m_tokens":524,"output_price_per_1m_tokens":524,"input_price":524,"output_price":524,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen2.5-vl-72b-instruct","qwen-qwen2.5-vl-72b-instruct","Qwen2.5 VL 72B Instruct","Qwen Qwen2.5 VL 72B Instruct",1738410311,{"provider_id":802,"slug":803,"model_name":804,"provider_name":375,"provider":805,"is_open":11,"author_country":12,"release_date":806,"release_month":778,"context_length":287,"input_price_per_1m_tokens":807,"output_price_per_1m_tokens":808,"input_price":807,"output_price":808,"benchmark_mmlu_pro":809,"benchmark_gpqa":810,"benchmark_aider":12,"benchmark_livecodebench":811,"benchmark_math_hard":812,"benchmark_aime":558,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen-turbo","qwen-qwen-turbo","Qwen-Turbo","Qwen Qwen-Turbo",1738410974,0.0325,0.13,63.3,41,16.3,80.5,{"provider_id":814,"slug":815,"model_name":816,"provider_name":375,"provider":817,"is_open":11,"author_country":12,"release_date":818,"release_month":778,"context_length":287,"input_price_per_1m_tokens":819,"output_price_per_1m_tokens":820,"input_price":819,"output_price":820,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen-vl-max","qwen-qwen-vl-max","Qwen VL Max","Qwen Qwen VL Max",1738434304,0.52,2.08,{"provider_id":822,"slug":823,"model_name":824,"provider_name":825,"provider":826,"is_open":11,"author_country":12,"release_date":827,"release_month":778,"context_length":115,"input_price_per_1m_tokens":524,"output_price_per_1m_tokens":828,"input_price":524,"output_price":828,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"aion-labs:aion-rp-llama-3.1-8b","aion-labs-aion-rp-llama-3.1-8b","Aion-RP 1.0 (8B)","Aion Labs","Aion Labs Aion-RP 1.0 (8B)",1738696718,1.6,{"provider_id":830,"slug":831,"model_name":832,"provider_name":825,"provider":833,"is_open":11,"author_country":12,"release_date":834,"release_month":778,"context_length":287,"input_price_per_1m_tokens":720,"output_price_per_1m_tokens":835,"input_price":720,"output_price":835,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"aion-labs:aion-1.0-mini","aion-labs-aion-1.0-mini","Aion-1.0-Mini","Aion Labs Aion-1.0-Mini",1738697107,1.4,{"provider_id":837,"slug":838,"model_name":839,"provider_name":825,"provider":840,"is_open":11,"author_country":12,"release_date":841,"release_month":778,"context_length":287,"input_price_per_1m_tokens":69,"output_price_per_1m_tokens":615,"input_price":69,"output_price":615,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"aion-labs:aion-1.0","aion-labs-aion-1.0","Aion-1.0","Aion Labs Aion-1.0",1738697557,{"provider_id":843,"slug":844,"model_name":845,"provider_name":375,"provider":846,"is_open":11,"author_country":12,"release_date":847,"release_month":778,"context_length":287,"input_price_per_1m_tokens":848,"output_price_per_1m_tokens":849,"input_price":848,"output_price":849,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen-vl-plus","qwen-qwen-vl-plus","Qwen VL Plus","Qwen Qwen VL Plus",1738731255,0.1365,0.4095,{"provider_id":851,"slug":852,"model_name":853,"provider_name":248,"provider":854,"is_open":11,"author_country":12,"release_date":855,"release_month":778,"context_length":856,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":536,"input_price":495,"output_price":536,"benchmark_mmlu_pro":857,"benchmark_gpqa":858,"benchmark_aider":12,"benchmark_livecodebench":859,"benchmark_math_hard":860,"benchmark_aime":861,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemini-2.0-flash-001","google-gemini-2.0-flash-001","Gemini 2.0 Flash","Google Gemini 2.0 Flash",1738769413,1048576,77.9,62.3,33.4,93,33,{"provider_id":863,"slug":864,"model_name":865,"provider_name":9,"provider":866,"is_open":11,"author_country":12,"release_date":867,"release_month":778,"context_length":142,"input_price_per_1m_tokens":700,"output_price_per_1m_tokens":765,"input_price":700,"output_price":765,"benchmark_mmlu_pro":868,"benchmark_gpqa":638,"benchmark_aider":12,"benchmark_livecodebench":869,"benchmark_math_hard":870,"benchmark_aime":871,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:o3-mini-high","openai-o3-mini-high","o3 Mini High","OpenAI o3 Mini High",1739372611,80.2,73.4,98.5,86,{"provider_id":873,"slug":874,"model_name":875,"provider_name":83,"provider":876,"is_open":37,"author_country":12,"release_date":877,"release_month":778,"context_length":115,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":274,"input_price":377,"output_price":274,"benchmark_mmlu_pro":878,"benchmark_gpqa":879,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":18,"benchmark_aime":880,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-saba","mistral-ai-mistral-saba","Saba","Mistral AI Saba",1739803239,61.1,42.4,13,{"provider_id":882,"slug":883,"model_name":884,"provider_name":138,"provider":885,"is_open":11,"author_country":12,"release_date":886,"release_month":778,"context_length":142,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"benchmark_mmlu_pro":887,"benchmark_gpqa":888,"benchmark_aider":329,"benchmark_livecodebench":148,"benchmark_math_hard":889,"benchmark_aime":890,"benchmark_mmlu_pro_reasoning":891,"benchmark_gpqa_reasoning":511,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":892,"benchmark_math_hard_reasoning":893,"benchmark_aime_reasoning":737,"benchmark_coding_reasoning":415,"benchmark_intelligence_reasoning":425,"benchmark_math_reasoning":894},"anthropic:claude-3.7-sonnet","anthropic-claude-3.7-sonnet","Claude 3.7 Sonnet","Anthropic Claude 3.7 Sonnet",1740422110,80.3,65.6,85,22.3,83.7,47.3,94.7,56.3,{"provider_id":896,"slug":897,"model_name":898,"provider_name":248,"provider":899,"is_open":11,"author_country":12,"release_date":900,"release_month":778,"context_length":856,"input_price_per_1m_tokens":901,"output_price_per_1m_tokens":50,"input_price":901,"output_price":50,"benchmark_mmlu_pro":902,"benchmark_gpqa":903,"benchmark_aider":12,"benchmark_livecodebench":904,"benchmark_math_hard":905,"benchmark_aime":906,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemini-2.0-flash-lite-001","google-gemini-2.0-flash-lite-001","Gemini 2.0 Flash Lite","Google Gemini 2.0 Flash Lite",1740506212,0.075,72.4,53.5,18.5,87.3,27.7,{"provider_id":908,"slug":909,"model_name":910,"provider_name":375,"provider":911,"is_open":37,"author_country":12,"release_date":912,"release_month":913,"context_length":115,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":914,"input_price":273,"output_price":914,"benchmark_mmlu_pro":275,"benchmark_gpqa":915,"benchmark_aider":916,"benchmark_livecodebench":917,"benchmark_math_hard":918,"benchmark_aime":919,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwq-32b","qwen-qwq-32b","QwQ 32B","Qwen QwQ 32B",1741208814,"2025-03",0.58,55.7,26.2,33.7,91,45.3,{"provider_id":921,"slug":922,"model_name":923,"provider_name":730,"provider":924,"is_open":11,"author_country":12,"release_date":925,"release_month":913,"context_length":129,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":615,"input_price":78,"output_price":615,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"perplexity:sonar-deep-research","perplexity-sonar-deep-research","Sonar Deep Research","Perplexity Sonar Deep Research",1741311246,{"provider_id":927,"slug":928,"model_name":929,"provider_name":730,"provider":930,"is_open":11,"author_country":12,"release_date":931,"release_month":913,"context_length":142,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"benchmark_mmlu_pro":932,"benchmark_gpqa":933,"benchmark_aider":12,"benchmark_livecodebench":934,"benchmark_math_hard":935,"benchmark_aime":936,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"perplexity:sonar-pro","perplexity-sonar-pro","Sonar Pro","Perplexity Sonar Pro",1741312423,75.5,57.8,27.5,74.5,29,{"provider_id":938,"slug":939,"model_name":940,"provider_name":730,"provider":941,"is_open":11,"author_country":12,"release_date":942,"release_month":913,"context_length":129,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":615,"input_price":78,"output_price":615,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":943,"benchmark_aime":944,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"perplexity:sonar-reasoning-pro","perplexity-sonar-reasoning-pro","Sonar Reasoning Pro","Perplexity Sonar Reasoning Pro",1741313308,95.7,79,{"provider_id":946,"slug":947,"model_name":948,"provider_name":455,"provider":949,"is_open":37,"author_country":12,"release_date":950,"release_month":913,"context_length":115,"input_price_per_1m_tokens":708,"output_price_per_1m_tokens":524,"input_price":708,"output_price":524,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"thedrummer:skyfall-36b-v2","thedrummer-skyfall-36b-v2","Skyfall 36B V2","Thedrummer Skyfall 36B V2",1741636566,{"provider_id":952,"slug":953,"model_name":954,"provider_name":248,"provider":955,"is_open":37,"author_country":12,"release_date":956,"release_month":913,"context_length":129,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":957,"input_price":251,"output_price":957,"benchmark_mmlu_pro":958,"benchmark_gpqa":959,"benchmark_aider":960,"benchmark_livecodebench":961,"benchmark_math_hard":962,"benchmark_aime":963,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemma-3-27b-it","google-gemma-3-27b-it","Gemma 3 27B","Google Gemma 3 27B",1741756359,0.16,66.9,42.8,4.9,13.7,88.3,25.3,{"provider_id":965,"slug":966,"model_name":967,"provider_name":968,"provider":969,"is_open":11,"author_country":12,"release_date":970,"release_month":913,"context_length":181,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":377,"input_price":495,"output_price":377,"benchmark_mmlu_pro":958,"benchmark_gpqa":971,"benchmark_aider":12,"benchmark_livecodebench":972,"benchmark_math_hard":973,"benchmark_aime":974,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"reka:reka-flash-3","reka-reka-flash-3","Reka Flash 3","Reka","Reka Reka Flash 3",1741812813,52.9,43.5,89.3,51,{"provider_id":976,"slug":977,"model_name":978,"provider_name":385,"provider":979,"is_open":37,"author_country":12,"release_date":980,"release_month":913,"context_length":981,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":156,"input_price":220,"output_price":156,"benchmark_mmlu_pro":982,"benchmark_gpqa":133,"benchmark_aider":558,"benchmark_livecodebench":983,"benchmark_math_hard":984,"benchmark_aime":985,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"cohere:command-a","cohere-command-a","Command A","Cohere Command A",1741894342,256000,71.2,28.7,81.9,9.7,{"provider_id":987,"slug":988,"model_name":989,"provider_name":248,"provider":990,"is_open":37,"author_country":12,"release_date":991,"release_month":913,"context_length":287,"input_price_per_1m_tokens":208,"output_price_per_1m_tokens":808,"input_price":208,"output_price":808,"benchmark_mmlu_pro":992,"benchmark_gpqa":993,"benchmark_aider":12,"benchmark_livecodebench":961,"benchmark_math_hard":994,"benchmark_aime":995,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemma-3-12b-it","google-gemma-3-12b-it","Gemma 3 12B","Google Gemma 3 12B",1741902625,59.5,34.9,85.3,22,{"provider_id":997,"slug":998,"model_name":999,"provider_name":248,"provider":1000,"is_open":37,"author_country":12,"release_date":1001,"release_month":913,"context_length":287,"input_price_per_1m_tokens":208,"output_price_per_1m_tokens":251,"input_price":208,"output_price":251,"benchmark_mmlu_pro":554,"benchmark_gpqa":159,"benchmark_aider":12,"benchmark_livecodebench":1002,"benchmark_math_hard":1003,"benchmark_aime":1004,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemma-3-4b-it","google-gemma-3-4b-it","Gemma 3 4B","Google Gemma 3 4B",1741905510,11.2,76.6,6.3,{"provider_id":1006,"slug":1007,"model_name":1008,"provider_name":1009,"provider":1010,"is_open":37,"author_country":12,"release_date":1011,"release_month":913,"context_length":129,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":377,"input_price":299,"output_price":377,"benchmark_mmlu_pro":1012,"benchmark_gpqa":1013,"benchmark_aider":12,"benchmark_livecodebench":1014,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"allenai:olmo-2-0325-32b-instruct","allenai-olmo-2-0325-32b-instruct","Olmo 2 32B Instruct","Allenai","Allenai Olmo 2 32B Instruct",1741988556,51.1,32.8,6.8,{"provider_id":1016,"slug":1017,"model_name":1018,"provider_name":83,"provider":1019,"is_open":37,"author_country":12,"release_date":1020,"release_month":913,"context_length":129,"input_price_per_1m_tokens":207,"output_price_per_1m_tokens":86,"input_price":207,"output_price":86,"benchmark_mmlu_pro":1021,"benchmark_gpqa":1022,"benchmark_aider":12,"benchmark_livecodebench":1023,"benchmark_math_hard":1024,"benchmark_aime":450,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-small-3.1-24b-instruct","mistral-ai-mistral-small-3.1-24b-instruct","Mistral Small 3.1 24B","Mistral AI Mistral Small 3.1 24B",1742238937,65.9,45.4,21.2,70.7,{"provider_id":1026,"slug":1027,"model_name":1028,"provider_name":9,"provider":1029,"is_open":11,"author_country":12,"release_date":1030,"release_month":913,"context_length":142,"input_price_per_1m_tokens":1031,"output_price_per_1m_tokens":1032,"input_price":1031,"output_price":1032,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:o1-pro","openai-o1-pro","o1-pro","OpenAI o1-pro",1742423211,150,600,{"provider_id":1034,"slug":1035,"model_name":1036,"provider_name":667,"provider":1037,"is_open":37,"author_country":12,"release_date":1038,"release_month":913,"context_length":670,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":1039,"input_price":377,"output_price":1039,"benchmark_mmlu_pro":1040,"benchmark_gpqa":915,"benchmark_aider":1041,"benchmark_livecodebench":784,"benchmark_math_hard":1042,"benchmark_aime":963,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"deepseek:deepseek-chat-v3-0324","deepseek-deepseek-chat-v3-0324","DeepSeek V3 0324","Deepseek DeepSeek V3 0324",1742824755,0.77,75.2,55.1,88.7,{"provider_id":1044,"slug":1045,"model_name":1046,"provider_name":375,"provider":1047,"is_open":37,"author_country":12,"release_date":1048,"release_month":913,"context_length":129,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":274,"input_price":377,"output_price":274,"benchmark_mmlu_pro":587,"benchmark_gpqa":1049,"benchmark_aider":12,"benchmark_livecodebench":1050,"benchmark_math_hard":812,"benchmark_aime":448,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen2.5-vl-32b-instruct","qwen-qwen2.5-vl-32b-instruct","Qwen2.5 VL 32B Instruct","Qwen Qwen2.5 VL 32B Instruct",1742839838,46.6,24.8,{"provider_id":1052,"slug":1053,"model_name":1054,"provider_name":191,"provider":1055,"is_open":37,"author_country":12,"release_date":1056,"release_month":1057,"context_length":1058,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":50,"input_price":251,"output_price":50,"benchmark_mmlu_pro":1040,"benchmark_gpqa":782,"benchmark_aider":12,"benchmark_livecodebench":121,"benchmark_math_hard":709,"benchmark_aime":1059,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meta-llama:llama-4-scout","meta-llama-llama-4-scout","Llama 4 Scout","Meta-llama Llama 4 Scout",1743881519,"2025-04",327680,28.3,{"provider_id":1061,"slug":1062,"model_name":1063,"provider_name":191,"provider":1064,"is_open":37,"author_country":12,"release_date":1065,"release_month":1057,"context_length":856,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":274,"input_price":273,"output_price":274,"benchmark_mmlu_pro":1066,"benchmark_gpqa":1067,"benchmark_aider":1068,"benchmark_livecodebench":1069,"benchmark_math_hard":1070,"benchmark_aime":1071,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meta-llama:llama-4-maverick","meta-llama-llama-4-maverick","Llama 4 Maverick","Meta-llama Llama 4 Maverick",1743881822,80.9,67.1,15.6,39.7,88.9,39,{"provider_id":1073,"slug":1074,"model_name":1075,"provider_name":1076,"provider":1077,"is_open":11,"author_country":12,"release_date":1078,"release_month":1057,"context_length":287,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":1079,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"xai:grok-3-beta","xai-grok-3-beta","Grok 3 Beta","Xai","Xai Grok 3 Beta",1744240068,53.3,{"provider_id":1081,"slug":1082,"model_name":1083,"provider_name":1076,"provider":1084,"is_open":11,"author_country":12,"release_date":1085,"release_month":1057,"context_length":287,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":25,"input_price":50,"output_price":25,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":1086,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"xai:grok-3-mini-beta","xai-grok-3-mini-beta","Grok 3 Mini Beta","Xai Grok 3 Mini Beta",1744240195,49.3,{"provider_id":1088,"slug":1089,"model_name":1090,"provider_name":1091,"provider":1092,"is_open":37,"author_country":12,"release_date":1093,"release_month":1057,"context_length":40,"input_price_per_1m_tokens":524,"output_price_per_1m_tokens":182,"input_price":524,"output_price":182,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"alfredpros:codellama-7b-instruct-solidity","alfredpros-codellama-7b-instruct-solidity","CodeLLaMa 7B Instruct Solidity","Alfredpros","Alfredpros CodeLLaMa 7B Instruct Solidity",1744641874,{"provider_id":1095,"slug":1096,"model_name":1097,"provider_name":1098,"provider":1099,"is_open":37,"author_country":12,"release_date":1100,"release_month":1057,"context_length":40,"input_price_per_1m_tokens":524,"output_price_per_1m_tokens":182,"input_price":524,"output_price":182,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"eleutherai:llemma_7b","eleutherai-llemma_7b","Llemma 7b","Eleutherai","Eleutherai Llemma 7b",1744643225,{"provider_id":1102,"slug":1103,"model_name":1104,"provider_name":9,"provider":1105,"is_open":11,"author_country":12,"release_date":1106,"release_month":1057,"context_length":1107,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":377,"input_price":299,"output_price":377,"benchmark_mmlu_pro":1108,"benchmark_gpqa":1109,"benchmark_aider":1110,"benchmark_livecodebench":1111,"benchmark_math_hard":1112,"benchmark_aime":1113,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-4.1-nano","openai-gpt-4.1-nano","GPT-4.1 Nano","OpenAI GPT-4.1 Nano",1744651369,1047576,65.7,51.2,8.9,32.6,84.8,23.7,{"provider_id":1115,"slug":1116,"model_name":1117,"provider_name":9,"provider":1118,"is_open":11,"author_country":12,"release_date":1119,"release_month":1057,"context_length":1107,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":524,"input_price":377,"output_price":524,"benchmark_mmlu_pro":1120,"benchmark_gpqa":1121,"benchmark_aider":1122,"benchmark_livecodebench":201,"benchmark_math_hard":1123,"benchmark_aime":1124,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-4.1-mini","openai-gpt-4.1-mini","GPT-4.1 Mini","OpenAI GPT-4.1 Mini",1744651381,78.1,66.4,32.4,92.5,43,{"provider_id":1126,"slug":1127,"model_name":1128,"provider_name":9,"provider":1129,"is_open":11,"author_country":12,"release_date":1130,"release_month":1057,"context_length":1107,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":615,"input_price":78,"output_price":615,"benchmark_mmlu_pro":1131,"benchmark_gpqa":1132,"benchmark_aider":1133,"benchmark_livecodebench":1134,"benchmark_math_hard":1135,"benchmark_aime":1136,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-4.1","openai-gpt-4.1","GPT-4.1","OpenAI GPT-4.1",1744651385,80.6,66.6,52.4,45.7,91.3,43.7,{"provider_id":1138,"slug":1139,"model_name":1140,"provider_name":375,"provider":1141,"is_open":37,"author_country":12,"release_date":1142,"release_month":1057,"context_length":115,"input_price_per_1m_tokens":207,"output_price_per_1m_tokens":404,"input_price":207,"output_price":404,"benchmark_mmlu_pro":892,"benchmark_gpqa":1143,"benchmark_aider":12,"benchmark_livecodebench":1144,"benchmark_math_hard":1145,"benchmark_aime":1146,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen2.5-coder-7b-instruct","qwen-qwen2.5-coder-7b-instruct","Qwen2.5 Coder 7B Instruct","Qwen Qwen2.5 Coder 7B Instruct",1744734887,33.9,12.6,66,5.3,{"provider_id":1148,"slug":1149,"model_name":1150,"provider_name":9,"provider":1151,"is_open":11,"author_country":12,"release_date":1152,"release_month":1057,"context_length":142,"input_price_per_1m_tokens":708,"output_price_per_1m_tokens":1153,"input_price":708,"output_price":1153,"benchmark_mmlu_pro":1154,"benchmark_gpqa":1155,"benchmark_aider":412,"benchmark_livecodebench":1156,"benchmark_math_hard":1157,"benchmark_aime":1158,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:o4-mini","openai-o4-mini","o4 Mini","OpenAI o4 Mini",1744820942,2.2,83.2,78.4,85.9,98.9,94,{"provider_id":1160,"slug":1161,"model_name":1162,"provider_name":9,"provider":1163,"is_open":11,"author_country":12,"release_date":1164,"release_month":1057,"context_length":142,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":615,"input_price":78,"output_price":615,"benchmark_mmlu_pro":994,"benchmark_gpqa":1165,"benchmark_aider":1166,"benchmark_livecodebench":1167,"benchmark_math_hard":1168,"benchmark_aime":1169,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:o3","openai-o3","o3","OpenAI o3",1744823457,82.7,81.3,80.8,99.2,90.3,{"provider_id":1171,"slug":1172,"model_name":1173,"provider_name":9,"provider":1174,"is_open":11,"author_country":12,"release_date":1175,"release_month":1057,"context_length":142,"input_price_per_1m_tokens":700,"output_price_per_1m_tokens":765,"input_price":700,"output_price":765,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:o4-mini-high","openai-o4-mini-high","o4 Mini High","OpenAI o4 Mini High",1744824212,{"provider_id":1177,"slug":1178,"model_name":1179,"provider_name":375,"provider":1180,"is_open":37,"author_country":12,"release_date":1181,"release_month":1057,"context_length":287,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":524,"input_price":536,"output_price":524,"benchmark_mmlu_pro":781,"benchmark_gpqa":1182,"benchmark_aider":1183,"benchmark_livecodebench":1184,"benchmark_math_hard":1185,"benchmark_aime":1186,"benchmark_mmlu_pro_reasoning":1187,"benchmark_gpqa_reasoning":1188,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1189,"benchmark_math_hard_reasoning":860,"benchmark_aime_reasoning":1190,"benchmark_coding_reasoning":1191,"benchmark_intelligence_reasoning":200,"benchmark_math_reasoning":1192},"qwen:qwen3-235b-a22b","qwen-qwen3-235b-a22b","Qwen3 235B A22B","Qwen Qwen3 235B A22B",1745875757,61.3,59.6,34.3,90.2,32.7,82.8,70,62.2,84,17.4,82,{"provider_id":1194,"slug":1195,"model_name":1196,"provider_name":375,"provider":1197,"is_open":37,"author_country":12,"release_date":1198,"release_month":1057,"context_length":1199,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":622,"input_price":251,"output_price":622,"benchmark_mmlu_pro":1200,"benchmark_gpqa":903,"benchmark_aider":1201,"benchmark_livecodebench":637,"benchmark_math_hard":1202,"benchmark_aime":1203,"benchmark_mmlu_pro_reasoning":1204,"benchmark_gpqa_reasoning":1205,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1206,"benchmark_math_hard_reasoning":1207,"benchmark_aime_reasoning":1208,"benchmark_coding_reasoning":1209,"benchmark_intelligence_reasoning":1210,"benchmark_math_reasoning":1211},"qwen:qwen3-32b","qwen-qwen3-32b","Qwen3 32B","Qwen Qwen3 32B",1745875945,40960,72.7,40,86.9,30.3,79.8,66.8,54.6,96.1,80.7,13.8,16.5,73,{"provider_id":1213,"slug":1214,"model_name":1215,"provider_name":375,"provider":1216,"is_open":37,"author_country":12,"release_date":1217,"release_month":1057,"context_length":1199,"input_price_per_1m_tokens":41,"output_price_per_1m_tokens":377,"input_price":41,"output_price":377,"benchmark_mmlu_pro":1218,"benchmark_gpqa":1219,"benchmark_aider":12,"benchmark_livecodebench":1220,"benchmark_math_hard":1221,"benchmark_aime":1220,"benchmark_mmlu_pro_reasoning":1222,"benchmark_gpqa_reasoning":768,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1223,"benchmark_math_hard_reasoning":1207,"benchmark_aime_reasoning":1224,"benchmark_coding_reasoning":1225,"benchmark_intelligence_reasoning":1226,"benchmark_math_reasoning":915},"qwen:qwen3-14b","qwen-qwen3-14b","Qwen3 14B","Qwen Qwen3 14B",1745876478,67.5,47,28,87.1,77.4,52.3,76.3,13.1,16.2,{"provider_id":1228,"slug":1229,"model_name":1230,"provider_name":375,"provider":1231,"is_open":37,"author_country":12,"release_date":1232,"release_month":1057,"context_length":1199,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":377,"input_price":299,"output_price":377,"benchmark_mmlu_pro":1233,"benchmark_gpqa":1234,"benchmark_aider":12,"benchmark_livecodebench":1235,"benchmark_math_hard":1187,"benchmark_aime":1236,"benchmark_mmlu_pro_reasoning":1237,"benchmark_gpqa_reasoning":1238,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1239,"benchmark_math_hard_reasoning":1240,"benchmark_aime_reasoning":653,"benchmark_coding_reasoning":1241,"benchmark_intelligence_reasoning":1242,"benchmark_math_reasoning":1243},"qwen:qwen3-8b","qwen-qwen3-8b","Qwen3 8B","Qwen Qwen3 8B",1745876632,64.3,45.2,20.2,24.3,74.3,58.9,40.6,90.4,9,13.2,19,{"provider_id":1245,"slug":1246,"model_name":1247,"provider_name":375,"provider":1248,"is_open":37,"author_country":12,"release_date":1249,"release_month":1057,"context_length":1199,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":1250,"input_price":251,"output_price":1250,"benchmark_mmlu_pro":1251,"benchmark_gpqa":130,"benchmark_aider":12,"benchmark_livecodebench":1252,"benchmark_math_hard":1253,"benchmark_aime":1254,"benchmark_mmlu_pro_reasoning":1255,"benchmark_gpqa_reasoning":1256,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1257,"benchmark_math_hard_reasoning":1258,"benchmark_aime_reasoning":1259,"benchmark_coding_reasoning":448,"benchmark_intelligence_reasoning":1260,"benchmark_math_reasoning":656},"qwen:qwen3-30b-a3b","qwen-qwen3-30b-a3b","Qwen3 30B A3B","Qwen Qwen3 30B A3B",1745878604,0.28,71,32.2,86.3,26,77.7,61.6,50.6,95.9,75.3,15.3,{"provider_id":1262,"slug":1263,"model_name":1264,"provider_name":375,"provider":1265,"is_open":37,"author_country":12,"release_date":1266,"release_month":1057,"context_length":1199,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"benchmark_mmlu_pro":327,"benchmark_gpqa":1267,"benchmark_aider":12,"benchmark_livecodebench":603,"benchmark_math_hard":1268,"benchmark_aime":317,"benchmark_mmlu_pro_reasoning":1269,"benchmark_gpqa_reasoning":1270,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":484,"benchmark_math_hard_reasoning":1271,"benchmark_aime_reasoning":1108,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":1272,"benchmark_math_reasoning":890},"qwen:qwen3-4b","qwen-qwen3-4b","Qwen3 4B","Qwen Qwen3 4B",1746031104,39.8,84.3,69.6,52.2,93.3,14.2,{"provider_id":1274,"slug":1275,"model_name":1276,"provider_name":1277,"provider":1278,"is_open":11,"author_country":12,"release_date":1279,"release_month":1057,"context_length":129,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":60,"input_price":143,"output_price":60,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"inception:mercury-coder","inception-mercury-coder","Mercury Coder","Inception","Inception Mercury Coder",1746033880,{"provider_id":1281,"slug":1282,"model_name":1283,"provider_name":1284,"provider":1285,"is_open":37,"author_country":12,"release_date":1286,"release_month":1287,"context_length":115,"input_price_per_1m_tokens":25,"output_price_per_1m_tokens":524,"input_price":25,"output_price":524,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"arcee-ai:coder-large","arcee-ai-coder-large","Coder Large","Arcee AI","Arcee AI Coder Large",1746478663,"2025-05",{"provider_id":1289,"slug":1290,"model_name":1291,"provider_name":1284,"provider":1292,"is_open":37,"author_country":12,"release_date":1293,"release_month":1287,"context_length":287,"input_price_per_1m_tokens":60,"output_price_per_1m_tokens":182,"input_price":60,"output_price":182,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"arcee-ai:virtuoso-large","arcee-ai-virtuoso-large","Virtuoso Large","Arcee AI Virtuoso Large",1746478885,{"provider_id":1295,"slug":1296,"model_name":1297,"provider_name":1284,"provider":1298,"is_open":37,"author_country":12,"release_date":1299,"release_month":1287,"context_length":287,"input_price_per_1m_tokens":312,"output_price_per_1m_tokens":529,"input_price":312,"output_price":529,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"arcee-ai:maestro-reasoning","arcee-ai-maestro-reasoning","Maestro Reasoning","Arcee AI Maestro Reasoning",1746481269,{"provider_id":1301,"slug":1302,"model_name":1303,"provider_name":1284,"provider":1304,"is_open":37,"author_country":12,"release_date":1305,"release_month":1287,"context_length":287,"input_price_per_1m_tokens":1306,"output_price_per_1m_tokens":1306,"input_price":1306,"output_price":1306,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"arcee-ai:spotlight","arcee-ai-spotlight","Spotlight","Arcee AI Spotlight",1746481552,0.18,{"provider_id":1308,"slug":1309,"model_name":1310,"provider_name":248,"provider":1311,"is_open":11,"author_country":12,"release_date":1312,"release_month":1287,"context_length":856,"input_price_per_1m_tokens":144,"output_price_per_1m_tokens":156,"input_price":144,"output_price":156,"benchmark_mmlu_pro":891,"benchmark_gpqa":1313,"benchmark_aider":1314,"benchmark_livecodebench":771,"benchmark_math_hard":1315,"benchmark_aime":1268,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemini-2.5-pro-preview-05-06","google-gemini-2.5-pro-preview-05-06","Gemini 2.5 Pro Preview 05-06","Google Gemini 2.5 Pro Preview 05-06",1746578513,82.2,76.9,98.6,{"provider_id":1317,"slug":1318,"model_name":1319,"provider_name":83,"provider":1320,"is_open":11,"author_country":12,"release_date":1321,"release_month":1287,"context_length":287,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":78,"input_price":536,"output_price":78,"benchmark_mmlu_pro":1322,"benchmark_gpqa":933,"benchmark_aider":12,"benchmark_livecodebench":1201,"benchmark_math_hard":1323,"benchmark_aime":1324,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-medium-3","mistral-ai-mistral-medium-3","Mistral Medium 3","Mistral AI Mistral Medium 3",1746627341,76,90.7,44,{"provider_id":1326,"slug":1327,"model_name":1328,"provider_name":248,"provider":1329,"is_open":37,"author_country":12,"release_date":1330,"release_month":1287,"context_length":115,"input_price_per_1m_tokens":288,"output_price_per_1m_tokens":208,"input_price":288,"output_price":208,"benchmark_mmlu_pro":1331,"benchmark_gpqa":210,"benchmark_aider":12,"benchmark_livecodebench":1332,"benchmark_math_hard":515,"benchmark_aime":961,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemma-3n-e4b-it","google-gemma-3n-e4b-it","Gemma 3n 4B","Google Gemma 3n 4B",1747776824,48.8,14.6,{"provider_id":1334,"slug":1335,"model_name":1336,"provider_name":138,"provider":1337,"is_open":11,"author_country":12,"release_date":1338,"release_month":1287,"context_length":142,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"benchmark_mmlu_pro":891,"benchmark_gpqa":577,"benchmark_aider":1182,"benchmark_livecodebench":1339,"benchmark_math_hard":1340,"benchmark_aime":1341,"benchmark_mmlu_pro_reasoning":513,"benchmark_gpqa_reasoning":1255,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1342,"benchmark_math_hard_reasoning":1343,"benchmark_aime_reasoning":638,"benchmark_coding_reasoning":1344,"benchmark_intelligence_reasoning":118,"benchmark_math_reasoning":1237},"anthropic:claude-sonnet-4","anthropic-claude-sonnet-4","Claude Sonnet 4","Anthropic Claude Sonnet 4",1747930371,44.9,93.4,40.7,65.5,99.1,34.1,{"provider_id":1346,"slug":1347,"model_name":1348,"provider_name":138,"provider":1349,"is_open":11,"author_country":12,"release_date":1350,"release_month":1287,"context_length":142,"input_price_per_1m_tokens":161,"output_price_per_1m_tokens":1351,"input_price":161,"output_price":1351,"benchmark_mmlu_pro":871,"benchmark_gpqa":566,"benchmark_aider":412,"benchmark_livecodebench":1352,"benchmark_math_hard":748,"benchmark_aime":894,"benchmark_mmlu_pro_reasoning":905,"benchmark_gpqa_reasoning":1353,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1354,"benchmark_math_hard_reasoning":1355,"benchmark_aime_reasoning":1356,"benchmark_coding_reasoning":1357,"benchmark_intelligence_reasoning":1071,"benchmark_math_reasoning":487},"anthropic:claude-opus-4","anthropic-claude-opus-4","Claude Opus 4","Anthropic Claude Opus 4",1747931245,75,54.2,79.6,63.6,98.2,75.7,34,{"provider_id":1359,"slug":1360,"model_name":1361,"provider_name":667,"provider":1362,"is_open":11,"author_country":12,"release_date":1363,"release_month":1287,"context_length":670,"input_price_per_1m_tokens":1364,"output_price_per_1m_tokens":1365,"input_price":1364,"output_price":1365,"benchmark_mmlu_pro":1366,"benchmark_gpqa":1166,"benchmark_aider":569,"benchmark_livecodebench":771,"benchmark_math_hard":1367,"benchmark_aime":973,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"deepseek:deepseek-r1-0528","deepseek-deepseek-r1-0528","R1 0528","Deepseek R1 0528",1748455170,0.45,2.15,84.9,98.3,{"provider_id":1369,"slug":1370,"model_name":1371,"provider_name":248,"provider":1372,"is_open":11,"author_country":12,"release_date":1373,"release_month":1374,"context_length":856,"input_price_per_1m_tokens":144,"output_price_per_1m_tokens":156,"input_price":144,"output_price":156,"benchmark_mmlu_pro":416,"benchmark_gpqa":1375,"benchmark_aider":1376,"benchmark_livecodebench":1377,"benchmark_math_hard":1378,"benchmark_aime":1379,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemini-2.5-pro-preview","google-gemini-2.5-pro-preview","Gemini 2.5 Pro Preview 06-05","Google Gemini 2.5 Pro Preview 06-05",1749137257,"2025-06",83.6,83.1,77.8,98,87,{"provider_id":1381,"slug":1382,"model_name":1383,"provider_name":1076,"provider":1384,"is_open":11,"author_country":12,"release_date":1385,"release_month":1374,"context_length":287,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"xai:grok-3","xai-grok-3","Grok 3","Xai Grok 3",1749582908,{"provider_id":1387,"slug":1388,"model_name":1389,"provider_name":1076,"provider":1390,"is_open":11,"author_country":12,"release_date":1391,"release_month":1374,"context_length":287,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":25,"input_price":143,"output_price":25,"benchmark_mmlu_pro":1187,"benchmark_gpqa":766,"benchmark_aider":12,"benchmark_livecodebench":1269,"benchmark_math_hard":1168,"benchmark_aime":1271,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"xai:grok-3-mini","xai-grok-3-mini","Grok 3 Mini","Xai Grok 3 Mini",1749583245,{"provider_id":1393,"slug":1394,"model_name":1395,"provider_name":9,"provider":1396,"is_open":11,"author_country":12,"release_date":1397,"release_month":1374,"context_length":142,"input_price_per_1m_tokens":436,"output_price_per_1m_tokens":1398,"input_price":436,"output_price":1398,"benchmark_mmlu_pro":12,"benchmark_gpqa":1399,"benchmark_aider":1366,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:o3-pro","openai-o3-pro","o3 Pro","OpenAI o3 Pro",1749598352,80,84.5,{"provider_id":1401,"slug":1402,"model_name":1403,"provider_name":248,"provider":1404,"is_open":11,"author_country":12,"release_date":1405,"release_month":1374,"context_length":856,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":156,"input_price":61,"output_price":156,"benchmark_mmlu_pro":1406,"benchmark_gpqa":709,"benchmark_aider":12,"benchmark_livecodebench":1407,"benchmark_math_hard":1408,"benchmark_aime":1042,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemini-2.5-pro","google-gemini-2.5-pro","Gemini 2.5 Pro","Google Gemini 2.5 Pro",1750169544,86.2,80.1,96.7,{"provider_id":1410,"slug":1411,"model_name":1412,"provider_name":248,"provider":1413,"is_open":11,"author_country":12,"release_date":1414,"release_month":1374,"context_length":856,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":220,"input_price":50,"output_price":220,"benchmark_mmlu_pro":1066,"benchmark_gpqa":577,"benchmark_aider":1041,"benchmark_livecodebench":1415,"benchmark_math_hard":1416,"benchmark_aime":497,"benchmark_mmlu_pro_reasoning":1154,"benchmark_gpqa_reasoning":944,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1417,"benchmark_math_hard_reasoning":1418,"benchmark_aime_reasoning":1419,"benchmark_coding_reasoning":1420,"benchmark_intelligence_reasoning":747,"benchmark_math_reasoning":487},"google:gemini-2.5-flash","google-gemini-2.5-flash","Gemini 2.5 Flash","Google Gemini 2.5 Flash",1750172488,49.5,93.2,69.5,98.1,82.3,22.2,{"provider_id":1422,"slug":1423,"model_name":1424,"provider_name":696,"provider":1425,"is_open":37,"author_country":12,"release_date":1426,"release_month":1374,"context_length":792,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":1427,"input_price":536,"output_price":1427,"benchmark_mmlu_pro":1167,"benchmark_gpqa":1428,"benchmark_aider":12,"benchmark_livecodebench":1108,"benchmark_math_hard":1429,"benchmark_aime":1166,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"minimax:minimax-m1","minimax-minimax-m1","MiniMax M1","Minimax MiniMax M1",1750200414,1.76,68.2,97.2,{"provider_id":1431,"slug":1432,"model_name":1433,"provider_name":83,"provider":1434,"is_open":37,"author_country":12,"release_date":1435,"release_month":1374,"context_length":287,"input_price_per_1m_tokens":901,"output_price_per_1m_tokens":377,"input_price":901,"output_price":377,"benchmark_mmlu_pro":1436,"benchmark_gpqa":567,"benchmark_aider":12,"benchmark_livecodebench":934,"benchmark_math_hard":962,"benchmark_aime":1437,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-small-3.2-24b-instruct","mistral-ai-mistral-small-3.2-24b-instruct","Mistral Small 3.2 24B","Mistral AI Mistral Small 3.2 24B",1750443016,68.1,32.3,{"provider_id":1439,"slug":1440,"model_name":1441,"provider_name":1277,"provider":1442,"is_open":11,"author_country":12,"release_date":1443,"release_month":1374,"context_length":129,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":60,"input_price":143,"output_price":60,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"inception:mercury","inception-mercury","Mercury","Inception Mercury",1750973026,{"provider_id":1445,"slug":1446,"model_name":1447,"provider_name":1448,"provider":1449,"is_open":37,"author_country":12,"release_date":1450,"release_month":1374,"context_length":1451,"input_price_per_1m_tokens":1250,"output_price_per_1m_tokens":312,"input_price":1250,"output_price":312,"benchmark_mmlu_pro":1452,"benchmark_gpqa":1453,"benchmark_aider":12,"benchmark_livecodebench":1454,"benchmark_math_hard":1455,"benchmark_aime":1086,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"baidu:ernie-4.5-300b-a47b","baidu-ernie-4.5-300b-a47b","ERNIE 4.5 300B A47B","Baidu","Baidu ERNIE 4.5 300B A47B",1751300139,123000,77.6,81.1,46.7,93.1,{"provider_id":1457,"slug":1458,"model_name":1459,"provider_name":1448,"provider":1460,"is_open":37,"author_country":12,"release_date":1461,"release_month":1374,"context_length":1451,"input_price_per_1m_tokens":117,"output_price_per_1m_tokens":144,"input_price":117,"output_price":144,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"baidu:ernie-4.5-vl-424b-a47b","baidu-ernie-4.5-vl-424b-a47b","ERNIE 4.5 VL 424B A47B","Baidu ERNIE 4.5 VL 424B A47B",1751300903,{"provider_id":1463,"slug":1464,"model_name":1465,"provider_name":1466,"provider":1467,"is_open":11,"author_country":12,"release_date":1468,"release_month":1469,"context_length":1470,"input_price_per_1m_tokens":524,"output_price_per_1m_tokens":182,"input_price":524,"output_price":182,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"morph:morph-v3-fast","morph-morph-v3-fast","Morph V3 Fast","Morph","Morph Morph V3 Fast",1751910002,"2025-07",81920,{"provider_id":1472,"slug":1473,"model_name":1474,"provider_name":1466,"provider":1475,"is_open":11,"author_country":12,"release_date":1476,"release_month":1469,"context_length":1477,"input_price_per_1m_tokens":312,"output_price_per_1m_tokens":438,"input_price":312,"output_price":438,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"morph:morph-v3-large","morph-morph-v3-large","Morph V3 Large","Morph Morph V3 Large",1751910858,262144,{"provider_id":1479,"slug":1480,"model_name":1481,"provider_name":1482,"provider":1483,"is_open":37,"author_country":12,"release_date":1484,"release_month":1469,"context_length":670,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":700,"input_price":50,"output_price":700,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"tngtech:deepseek-r1t2-chimera","tngtech-deepseek-r1t2-chimera","DeepSeek R1T2 Chimera","Tngtech","Tngtech DeepSeek R1T2 Chimera",1751986985,{"provider_id":1486,"slug":1487,"model_name":1488,"provider_name":1489,"provider":1490,"is_open":11,"author_country":12,"release_date":1491,"release_month":1469,"context_length":287,"input_price_per_1m_tokens":116,"output_price_per_1m_tokens":1492,"input_price":116,"output_price":1492,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"tencent:hunyuan-a13b-instruct","tencent-hunyuan-a13b-instruct","Hunyuan A13B Instruct","Tencent","Tencent Hunyuan A13B Instruct",1751987664,0.57,{"provider_id":1494,"slug":1495,"model_name":1496,"provider_name":1076,"provider":1497,"is_open":11,"author_country":12,"release_date":1498,"release_month":1469,"context_length":981,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"benchmark_mmlu_pro":1499,"benchmark_gpqa":1500,"benchmark_aider":1353,"benchmark_livecodebench":984,"benchmark_math_hard":1501,"benchmark_aime":1502,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"xai:grok-4","xai-grok-4","Grok 4","Xai Grok 4",1752087689,86.6,87.7,99,94.3,{"provider_id":1504,"slug":1505,"model_name":1506,"provider_name":83,"provider":1507,"is_open":37,"author_country":12,"release_date":1508,"release_month":1469,"context_length":287,"input_price_per_1m_tokens":1509,"output_price_per_1m_tokens":1250,"input_price":1509,"output_price":1250,"benchmark_mmlu_pro":1189,"benchmark_gpqa":1510,"benchmark_aider":12,"benchmark_livecodebench":1511,"benchmark_math_hard":553,"benchmark_aime":50,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:devstral-small","mistral-ai-devstral-small","Devstral Small 1.1","Mistral AI Devstral Small 1.1",1752160751,0.07,41.4,25.4,{"provider_id":1513,"slug":1514,"model_name":1515,"provider_name":83,"provider":1516,"is_open":37,"author_country":12,"release_date":1517,"release_month":1469,"context_length":287,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":78,"input_price":536,"output_price":78,"benchmark_mmlu_pro":710,"benchmark_gpqa":199,"benchmark_aider":12,"benchmark_livecodebench":917,"benchmark_math_hard":1024,"benchmark_aime":429,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:devstral-medium","mistral-ai-devstral-medium","Devstral Medium","Mistral AI Devstral Medium",1752161321,{"provider_id":1519,"slug":1520,"model_name":1521,"provider_name":1522,"provider":1523,"is_open":37,"author_country":12,"release_date":1524,"release_month":1469,"context_length":311,"input_price_per_1m_tokens":708,"output_price_per_1m_tokens":1153,"input_price":708,"output_price":1153,"benchmark_mmlu_pro":1525,"benchmark_gpqa":1003,"benchmark_aider":1526,"benchmark_livecodebench":277,"benchmark_math_hard":1527,"benchmark_aime":1528,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"moonshotai:kimi-k2","moonshotai-kimi-k2","Kimi K2 0711","Moonshotai","Moonshotai Kimi K2 0711",1752263252,82.4,59.1,97.1,69.3,{"provider_id":1530,"slug":1531,"model_name":1532,"provider_name":1533,"provider":1534,"is_open":11,"author_country":12,"release_date":1535,"release_month":1469,"context_length":287,"input_price_per_1m_tokens":370,"output_price_per_1m_tokens":1536,"input_price":370,"output_price":1536,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"switchpoint:router","switchpoint-router","Switchpoint Router","Switchpoint","Switchpoint Switchpoint Router",1752272899,3.4,{"provider_id":1538,"slug":1539,"model_name":1540,"provider_name":375,"provider":1541,"is_open":37,"author_country":12,"release_date":1542,"release_month":1469,"context_length":1477,"input_price_per_1m_tokens":1543,"output_price_per_1m_tokens":495,"input_price":1543,"output_price":495,"benchmark_mmlu_pro":1187,"benchmark_gpqa":1259,"benchmark_aider":12,"benchmark_livecodebench":1133,"benchmark_math_hard":1378,"benchmark_aime":769,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-235b-a22b-2507","qwen-qwen3-235b-a22b-2507","Qwen3 235B A22B Instruct 2507","Qwen Qwen3 235B A22B Instruct 2507",1753119555,0.071,{"provider_id":1545,"slug":1546,"model_name":1547,"provider_name":248,"provider":1548,"is_open":11,"author_country":12,"release_date":1549,"release_month":1469,"context_length":856,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":536,"input_price":495,"output_price":536,"benchmark_mmlu_pro":902,"benchmark_gpqa":146,"benchmark_aider":12,"benchmark_livecodebench":1201,"benchmark_math_hard":1550,"benchmark_aime":497,"benchmark_mmlu_pro_reasoning":1551,"benchmark_gpqa_reasoning":1552,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1553,"benchmark_math_hard_reasoning":1554,"benchmark_aime_reasoning":316,"benchmark_coding_reasoning":1555,"benchmark_intelligence_reasoning":1556,"benchmark_math_reasoning":1079},"google:gemini-2.5-flash-lite","google-gemini-2.5-flash-lite","Gemini 2.5 Flash Lite","Google Gemini 2.5 Flash Lite",1753200276,92.6,75.9,62.5,59.3,96.9,9.5,17.6,{"provider_id":1558,"slug":1559,"model_name":1560,"provider_name":1561,"provider":1562,"is_open":37,"author_country":12,"release_date":1563,"release_month":1469,"context_length":129,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":377,"input_price":495,"output_price":377,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"bytedance:ui-tars-1.5-7b","bytedance-ui-tars-1.5-7b","UI-TARS 7B","Bytedance","Bytedance UI-TARS 7B",1753205056,{"provider_id":1565,"slug":1566,"model_name":1567,"provider_name":375,"provider":1568,"is_open":37,"author_country":12,"release_date":1569,"release_month":1469,"context_length":1477,"input_price_per_1m_tokens":1570,"output_price_per_1m_tokens":312,"input_price":1570,"output_price":312,"benchmark_mmlu_pro":1571,"benchmark_gpqa":1572,"benchmark_aider":12,"benchmark_livecodebench":1573,"benchmark_math_hard":1574,"benchmark_aime":1575,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-coder","qwen-qwen3-coder","Qwen3 Coder 480B A35B (exacto)","Qwen Qwen3 Coder 480B A35B (exacto)",1753230546,0.22,78.8,61.8,58.5,94.2,47.7,{"provider_id":1577,"slug":1578,"model_name":1579,"provider_name":1580,"provider":1581,"is_open":37,"author_country":12,"release_date":1582,"release_month":1469,"context_length":129,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":495,"input_price":495,"output_price":495,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"z-ai:glm-4-32b","z-ai-glm-4-32b","GLM 4 32B","Z-ai","Z-ai GLM 4 32B",1753376617,{"provider_id":1584,"slug":1585,"model_name":1586,"provider_name":375,"provider":1587,"is_open":37,"author_country":12,"release_date":1588,"release_month":1469,"context_length":1477,"input_price_per_1m_tokens":1589,"output_price_per_1m_tokens":312,"input_price":1589,"output_price":312,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1268,"benchmark_gpqa_reasoning":944,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1571,"benchmark_math_hard_reasoning":1590,"benchmark_aime_reasoning":1158,"benchmark_coding_reasoning":328,"benchmark_intelligence_reasoning":556,"benchmark_math_reasoning":918},"qwen:qwen3-235b-a22b-thinking-2507","qwen-qwen3-235b-a22b-thinking-2507","Qwen3 235B A22B Thinking 2507","Qwen Qwen3 235B A22B Thinking 2507",1753449557,0.1495,98.4,{"provider_id":1592,"slug":1593,"model_name":1594,"provider_name":1580,"provider":1595,"is_open":37,"author_country":12,"release_date":1596,"release_month":1469,"context_length":287,"input_price_per_1m_tokens":808,"output_price_per_1m_tokens":370,"input_price":808,"output_price":370,"benchmark_mmlu_pro":1597,"benchmark_gpqa":487,"benchmark_aider":12,"benchmark_livecodebench":1598,"benchmark_math_hard":1599,"benchmark_aime":1600,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"z-ai:glm-4.5-air","z-ai-glm-4.5-air","GLM 4.5 Air","Z-ai GLM 4.5 Air",1753471258,81.5,68.4,96.5,67.3,{"provider_id":1602,"slug":1603,"model_name":1604,"provider_name":1580,"provider":1605,"is_open":37,"author_country":12,"release_date":1606,"release_month":1469,"context_length":287,"input_price_per_1m_tokens":274,"output_price_per_1m_tokens":1153,"input_price":274,"output_price":1153,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":785,"benchmark_gpqa_reasoning":1607,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1608,"benchmark_math_hard_reasoning":1609,"benchmark_aime_reasoning":905,"benchmark_coding_reasoning":1610,"benchmark_intelligence_reasoning":1611,"benchmark_math_reasoning":160},"z-ai:glm-4.5","z-ai-glm-4.5","GLM 4.5","Z-ai GLM 4.5",1753471347,78.2,73.8,97.9,26.3,26.4,{"provider_id":1613,"slug":1614,"model_name":1615,"provider_name":375,"provider":1616,"is_open":37,"author_country":12,"release_date":1617,"release_month":1469,"context_length":1477,"input_price_per_1m_tokens":404,"output_price_per_1m_tokens":50,"input_price":404,"output_price":50,"benchmark_mmlu_pro":1255,"benchmark_gpqa":1021,"benchmark_aider":12,"benchmark_livecodebench":130,"benchmark_math_hard":1618,"benchmark_aime":1200,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-30b-a3b-instruct-2507","qwen-qwen3-30b-a3b-instruct-2507","Qwen3 30B A3B Instruct 2507","Qwen Qwen3 30B A3B Instruct 2507",1753806965,97.5,{"provider_id":1620,"slug":1621,"model_name":1622,"provider_name":375,"provider":1623,"is_open":37,"author_country":12,"release_date":1624,"release_month":1469,"context_length":1625,"input_price_per_1m_tokens":1509,"output_price_per_1m_tokens":1626,"input_price":1509,"output_price":1626,"benchmark_mmlu_pro":1627,"benchmark_gpqa":449,"benchmark_aider":12,"benchmark_livecodebench":1628,"benchmark_math_hard":973,"benchmark_aime":28,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-coder-30b-a3b-instruct","qwen-qwen3-coder-30b-a3b-instruct","Qwen3 Coder 30B A3B Instruct","Qwen Qwen3 Coder 30B A3B Instruct",1753972379,160000,0.27,70.6,40.3,{"provider_id":1630,"slug":1631,"model_name":1632,"provider_name":83,"provider":1633,"is_open":37,"author_country":12,"release_date":1634,"release_month":1635,"context_length":981,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":312,"input_price":50,"output_price":312,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":1636,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:codestral-2508","mistral-ai-codestral-2508","Codestral 2508","Mistral AI Codestral 2508",1754079630,"2025-08",11.1,{"provider_id":1638,"slug":1639,"model_name":1640,"provider_name":138,"provider":1641,"is_open":11,"author_country":12,"release_date":1642,"release_month":1635,"context_length":142,"input_price_per_1m_tokens":161,"output_price_per_1m_tokens":1351,"input_price":161,"output_price":1351,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1643,"benchmark_gpqa_reasoning":1066,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":414,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":1644,"benchmark_intelligence_reasoning":1645,"benchmark_math_reasoning":887},"anthropic:claude-opus-4.1","anthropic-claude-opus-4.1","Claude Opus 4.1","Anthropic Claude Opus 4.1",1754411591,88,36.5,42,{"provider_id":1647,"slug":1648,"model_name":1649,"provider_name":9,"provider":1650,"is_open":37,"author_country":12,"release_date":1651,"release_month":1635,"context_length":287,"input_price_per_1m_tokens":207,"output_price_per_1m_tokens":495,"input_price":207,"output_price":495,"benchmark_mmlu_pro":767,"benchmark_gpqa":1652,"benchmark_aider":12,"benchmark_livecodebench":1255,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-oss-20b","openai-gpt-oss-20b","GPT-OSS-20b","OpenAI GPT-OSS-20b",1754414229,68.8,{"provider_id":1654,"slug":1655,"model_name":1656,"provider_name":9,"provider":1657,"is_open":37,"author_country":12,"release_date":1658,"release_month":1635,"context_length":287,"input_price_per_1m_tokens":1659,"output_price_per_1m_tokens":495,"input_price":1659,"output_price":495,"benchmark_mmlu_pro":1660,"benchmark_gpqa":1661,"benchmark_aider":1662,"benchmark_livecodebench":1024,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-oss-120b","openai-gpt-oss-120b","GPT-OSS-120b","OpenAI GPT-OSS-120b",1754414231,0.039,77.5,67.2,41.8,{"provider_id":1664,"slug":1665,"model_name":1666,"provider_name":9,"provider":1667,"is_open":11,"author_country":12,"release_date":1668,"release_month":1635,"context_length":1669,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":536,"input_price":299,"output_price":536,"benchmark_mmlu_pro":277,"benchmark_gpqa":959,"benchmark_aider":12,"benchmark_livecodebench":1219,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5-nano","openai-gpt-5-nano","GPT-5 Nano","OpenAI GPT-5 Nano",1754587402,400000,{"provider_id":1671,"slug":1672,"model_name":1673,"provider_name":9,"provider":1674,"is_open":11,"author_country":12,"release_date":1675,"release_month":1635,"context_length":1669,"input_price_per_1m_tokens":1676,"output_price_per_1m_tokens":61,"input_price":1676,"output_price":61,"benchmark_mmlu_pro":891,"benchmark_gpqa":1187,"benchmark_aider":12,"benchmark_livecodebench":1677,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5-mini","openai-gpt-5-mini","GPT-5 Mini","OpenAI GPT-5 Mini",1754587407,0.125,83.8,{"provider_id":1679,"slug":1680,"model_name":1681,"provider_name":9,"provider":1682,"is_open":11,"author_country":12,"release_date":1683,"release_month":1635,"context_length":1669,"input_price_per_1m_tokens":107,"output_price_per_1m_tokens":505,"input_price":107,"output_price":505,"benchmark_mmlu_pro":1131,"benchmark_gpqa":1600,"benchmark_aider":1643,"benchmark_livecodebench":1684,"benchmark_math_hard":1685,"benchmark_aime":1686,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5","openai-gpt-5","GPT-5","OpenAI GPT-5",1754587413,55.8,86.1,36.7,{"provider_id":1688,"slug":1689,"model_name":1690,"provider_name":9,"provider":1691,"is_open":11,"author_country":12,"release_date":1692,"release_month":1635,"context_length":129,"input_price_per_1m_tokens":144,"output_price_per_1m_tokens":156,"input_price":144,"output_price":156,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5-chat","openai-gpt-5-chat","GPT-5 Chat","OpenAI GPT-5 Chat",1754587837,{"provider_id":1694,"slug":1695,"model_name":1696,"provider_name":1697,"provider":1698,"is_open":11,"author_country":12,"release_date":1699,"release_month":1635,"context_length":981,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":615,"input_price":78,"output_price":615,"benchmark_mmlu_pro":1700,"benchmark_gpqa":1071,"benchmark_aider":12,"benchmark_livecodebench":1701,"benchmark_math_hard":17,"benchmark_aime":230,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"ai21:jamba-large-1.7","ai21-jamba-large-1.7","Jamba Large 1.7","Ai21","Ai21 Jamba Large 1.7",1754669020,57.7,18.1,{"provider_id":1703,"slug":1704,"model_name":1705,"provider_name":1580,"provider":1706,"is_open":37,"author_country":12,"release_date":1707,"release_month":1635,"context_length":181,"input_price_per_1m_tokens":274,"output_price_per_1m_tokens":1708,"input_price":274,"output_price":1708,"benchmark_mmlu_pro":1709,"benchmark_gpqa":1710,"benchmark_aider":12,"benchmark_livecodebench":1711,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1571,"benchmark_gpqa_reasoning":1598,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":768,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":1712,"benchmark_intelligence_reasoning":1713,"benchmark_math_reasoning":1211},"z-ai:glm-4.5v","z-ai-glm-4.5v","GLM 4.5V","Z-ai GLM 4.5V",1754922288,1.8,75.1,57.3,35.2,10.9,15.1,{"provider_id":1715,"slug":1716,"model_name":1717,"provider_name":1448,"provider":1718,"is_open":37,"author_country":12,"release_date":1719,"release_month":1635,"context_length":1720,"input_price_per_1m_tokens":116,"output_price_per_1m_tokens":1721,"input_price":116,"output_price":1721,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"baidu:ernie-4.5-vl-28b-a3b","baidu-ernie-4.5-vl-28b-a3b","ERNIE 4.5 VL 28B A3B","Baidu ERNIE 4.5 VL 28B A3B",1755032836,30000,0.56,{"provider_id":1723,"slug":1724,"model_name":1725,"provider_name":1448,"provider":1726,"is_open":37,"author_country":12,"release_date":1727,"release_month":1635,"context_length":1728,"input_price_per_1m_tokens":1509,"output_price_per_1m_tokens":1250,"input_price":1509,"output_price":1250,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"baidu:ernie-4.5-21b-a3b","baidu-ernie-4.5-21b-a3b","ERNIE 4.5 21B A3B","Baidu ERNIE 4.5 21B A3B",1755034167,120000,{"provider_id":1730,"slug":1731,"model_name":1732,"provider_name":83,"provider":1733,"is_open":11,"author_country":12,"release_date":1734,"release_month":1635,"context_length":287,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":78,"input_price":536,"output_price":78,"benchmark_mmlu_pro":577,"benchmark_gpqa":1735,"benchmark_aider":12,"benchmark_livecodebench":1239,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-medium-3.1","mistral-ai-mistral-medium-3.1","Mistral Medium 3.1","Mistral AI Mistral Medium 3.1",1755095639,58.8,{"provider_id":1737,"slug":1738,"model_name":1739,"provider_name":667,"provider":1740,"is_open":37,"author_country":12,"release_date":1741,"release_month":1635,"context_length":115,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":60,"input_price":273,"output_price":60,"benchmark_mmlu_pro":1742,"benchmark_gpqa":1743,"benchmark_aider":12,"benchmark_livecodebench":1700,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1744,"benchmark_gpqa_reasoning":857,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1155,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":28,"benchmark_intelligence_reasoning":906,"benchmark_math_reasoning":1745},"deepseek:deepseek-chat-v3.1","deepseek-deepseek-chat-v3.1","DeepSeek V3.1","Deepseek DeepSeek V3.1",1755779628,83.3,73.5,85.1,89.7,{"provider_id":1747,"slug":1748,"model_name":1749,"provider_name":226,"provider":1750,"is_open":37,"author_country":12,"release_date":1751,"release_month":1635,"context_length":287,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":68,"input_price":61,"output_price":68,"benchmark_mmlu_pro":555,"benchmark_gpqa":1752,"benchmark_aider":12,"benchmark_livecodebench":1206,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1753,"benchmark_gpqa_reasoning":1200,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1754,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":417,"benchmark_intelligence_reasoning":1755,"benchmark_math_reasoning":587},"nousresearch:hermes-4-405b","nousresearch-hermes-4-405b","Hermes 4 405B","Nousresearch Hermes 4 405B",1756235463,53.6,82.9,68.6,18.6,{"provider_id":1757,"slug":1758,"model_name":1759,"provider_name":226,"provider":1760,"is_open":37,"author_country":12,"release_date":1761,"release_month":1635,"context_length":287,"input_price_per_1m_tokens":808,"output_price_per_1m_tokens":536,"input_price":808,"output_price":536,"benchmark_mmlu_pro":1121,"benchmark_gpqa":413,"benchmark_aider":12,"benchmark_livecodebench":1762,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1453,"benchmark_gpqa_reasoning":1763,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1764,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":1765,"benchmark_intelligence_reasoning":417,"benchmark_math_reasoning":749},"nousresearch:hermes-4-70b","nousresearch-hermes-4-70b","Hermes 4 70B","Nousresearch Hermes 4 70B",1756236182,26.9,69.9,65.3,14.4,{"provider_id":1767,"slug":1768,"model_name":1769,"provider_name":1076,"provider":1770,"is_open":11,"author_country":12,"release_date":1771,"release_month":1635,"context_length":981,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":26,"input_price":377,"output_price":26,"benchmark_mmlu_pro":1772,"benchmark_gpqa":1200,"benchmark_aider":12,"benchmark_livecodebench":1108,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"xai:grok-code-fast-1","xai-grok-code-fast-1","Grok Code Fast 1","Xai Grok Code Fast 1",1756238927,79.3,{"provider_id":1774,"slug":1775,"model_name":1776,"provider_name":375,"provider":1777,"is_open":37,"author_country":12,"release_date":1778,"release_month":1635,"context_length":115,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":50,"input_price":251,"output_price":50,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-30b-a3b-thinking-2507","qwen-qwen3-30b-a3b-thinking-2507","Qwen3 30B A3B Thinking 2507","Qwen Qwen3 30B A3B Thinking 2507",1756399192,{"provider_id":1780,"slug":1781,"model_name":1782,"provider_name":1522,"provider":1783,"is_open":37,"author_country":12,"release_date":1784,"release_month":1785,"context_length":1477,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":78,"input_price":536,"output_price":78,"benchmark_mmlu_pro":984,"benchmark_gpqa":557,"benchmark_aider":12,"benchmark_livecodebench":1786,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"moonshotai:kimi-k2-0905","moonshotai-kimi-k2-0905","Kimi K2 0905 (exacto)","Moonshotai Kimi K2 0905 (exacto)",1757021147,"2025-09",61,{"provider_id":1788,"slug":1789,"model_name":1790,"provider_name":480,"provider":1791,"is_open":37,"author_country":12,"release_date":1792,"release_month":1785,"context_length":287,"input_price_per_1m_tokens":208,"output_price_per_1m_tokens":957,"input_price":208,"output_price":957,"benchmark_mmlu_pro":745,"benchmark_gpqa":915,"benchmark_aider":12,"benchmark_livecodebench":566,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1793,"benchmark_gpqa_reasoning":1794,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":902,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":427,"benchmark_intelligence_reasoning":185,"benchmark_math_reasoning":587},"nvidia:nemotron-nano-9b-v2","nvidia-nemotron-nano-9b-v2","Nemotron Nano 9B V2","Nvidia Nemotron Nano 9B V2",1757106807,74.2,57,{"provider_id":1796,"slug":1797,"model_name":1798,"provider_name":375,"provider":1799,"is_open":11,"author_country":12,"release_date":1800,"release_month":1785,"context_length":792,"input_price_per_1m_tokens":793,"output_price_per_1m_tokens":794,"input_price":793,"output_price":794,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen-plus-2025-07-28","qwen-qwen-plus-2025-07-28","Qwen Plus 0728 (thinking)","Qwen Qwen Plus 0728 (thinking)",1757347599,{"provider_id":1802,"slug":1803,"model_name":1804,"provider_name":1805,"provider":1806,"is_open":11,"author_country":12,"release_date":1807,"release_month":1785,"context_length":287,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":524,"input_price":377,"output_price":524,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"meituan:longcat-flash-chat","meituan-longcat-flash-chat","LongCat Flash Chat","Meituan","Meituan LongCat Flash Chat",1757427658,{"provider_id":1809,"slug":1810,"model_name":1811,"provider_name":375,"provider":1812,"is_open":37,"author_country":12,"release_date":1813,"release_month":1785,"context_length":1477,"input_price_per_1m_tokens":404,"output_price_per_1m_tokens":794,"input_price":404,"output_price":794,"benchmark_mmlu_pro":984,"benchmark_gpqa":1608,"benchmark_aider":12,"benchmark_livecodebench":1598,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-next-80b-a3b-instruct","qwen-qwen3-next-80b-a3b-instruct","Qwen3 Next 80B A3B Instruct","Qwen Qwen3 Next 80B A3B Instruct",1757612213,{"provider_id":1815,"slug":1816,"model_name":1817,"provider_name":375,"provider":1818,"is_open":37,"author_country":12,"release_date":1819,"release_month":1785,"context_length":129,"input_price_per_1m_tokens":1820,"output_price_per_1m_tokens":50,"input_price":1820,"output_price":50,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-next-80b-a3b-thinking","qwen-qwen3-next-80b-a3b-thinking","Qwen3 Next 80B A3B Thinking","Qwen Qwen3 Next 80B A3B Thinking",1757612284,0.0975,{"provider_id":1822,"slug":1823,"model_name":1824,"provider_name":375,"provider":1825,"is_open":11,"author_country":12,"release_date":1826,"release_month":1785,"context_length":792,"input_price_per_1m_tokens":1827,"output_price_per_1m_tokens":1828,"input_price":1827,"output_price":1828,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-coder-flash","qwen-qwen3-coder-flash","Qwen3 Coder Flash","Qwen Qwen3 Coder Flash",1758115536,0.195,0.975,{"provider_id":1830,"slug":1831,"model_name":1832,"provider_name":1833,"provider":1834,"is_open":37,"author_country":12,"release_date":1835,"release_month":1785,"context_length":287,"input_price_per_1m_tokens":404,"output_price_per_1m_tokens":536,"input_price":404,"output_price":536,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"alibaba:tongyi-deepresearch-30b-a3b","alibaba-tongyi-deepresearch-30b-a3b","Tongyi DeepResearch 30B A3B","Alibaba","Alibaba Tongyi DeepResearch 30B A3B",1758210804,{"provider_id":1837,"slug":1838,"model_name":1839,"provider_name":1076,"provider":1840,"is_open":11,"author_country":12,"release_date":1841,"release_month":1785,"context_length":1842,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":25,"input_price":377,"output_price":25,"benchmark_mmlu_pro":1211,"benchmark_gpqa":1843,"benchmark_aider":12,"benchmark_livecodebench":360,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":889,"benchmark_gpqa_reasoning":1844,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1154,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":1845,"benchmark_intelligence_reasoning":131,"benchmark_math_reasoning":1745},"xai:grok-4-fast","xai-grok-4-fast","Grok 4 Fast","Xai Grok 4 Fast",1758240090,2000000,60.6,84.7,27.4,{"provider_id":1847,"slug":1848,"model_name":1849,"provider_name":667,"provider":1850,"is_open":37,"author_country":12,"release_date":1851,"release_month":1785,"context_length":670,"input_price_per_1m_tokens":1852,"output_price_per_1m_tokens":1853,"input_price":1852,"output_price":1853,"benchmark_mmlu_pro":1375,"benchmark_gpqa":1709,"benchmark_aider":12,"benchmark_livecodebench":971,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1744,"benchmark_gpqa_reasoning":1854,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1204,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":917,"benchmark_intelligence_reasoning":1143,"benchmark_math_reasoning":1745},"deepseek:deepseek-v3.1-terminus","deepseek-deepseek-v3.1-terminus","DeepSeek V3.1 Terminus","Deepseek DeepSeek V3.1 Terminus",1758548275,0.21,0.79,79.2,{"provider_id":1856,"slug":1857,"model_name":1858,"provider_name":9,"provider":1859,"is_open":11,"author_country":12,"release_date":1860,"release_month":1785,"context_length":1669,"input_price_per_1m_tokens":144,"output_price_per_1m_tokens":156,"input_price":144,"output_price":156,"benchmark_mmlu_pro":1861,"benchmark_gpqa":891,"benchmark_aider":12,"benchmark_livecodebench":1190,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5-codex","openai-gpt-5-codex","GPT-5 Codex","OpenAI GPT-5 Codex",1758643403,86.5,{"provider_id":1863,"slug":1864,"model_name":1865,"provider_name":375,"provider":1866,"is_open":37,"author_country":12,"release_date":1867,"release_month":1785,"context_length":792,"input_price_per_1m_tokens":262,"output_price_per_1m_tokens":1868,"input_price":262,"output_price":1868,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-coder-plus","qwen-qwen3-coder-plus","Qwen3 Coder Plus","Qwen Qwen3 Coder Plus",1758662707,3.25,{"provider_id":1870,"slug":1871,"model_name":1872,"provider_name":375,"provider":1873,"is_open":11,"author_country":12,"release_date":1874,"release_month":1785,"context_length":1477,"input_price_per_1m_tokens":794,"output_price_per_1m_tokens":1875,"input_price":794,"output_price":1875,"benchmark_mmlu_pro":1677,"benchmark_gpqa":1876,"benchmark_aider":12,"benchmark_livecodebench":1877,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-max","qwen-qwen3-max","Qwen3 Max","Qwen Qwen3 Max",1758662808,3.9,76.4,65.1,{"provider_id":1879,"slug":1880,"model_name":1881,"provider_name":375,"provider":1882,"is_open":37,"author_country":12,"release_date":1883,"release_month":1785,"context_length":1477,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":1884,"input_price":377,"output_price":1884,"benchmark_mmlu_pro":1419,"benchmark_gpqa":982,"benchmark_aider":12,"benchmark_livecodebench":636,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-vl-235b-a22b-instruct","qwen-qwen3-vl-235b-a22b-instruct","Qwen3 VL 235B A22B Instruct","Qwen Qwen3 VL 235B A22B Instruct",1758668687,0.88,{"provider_id":1886,"slug":1887,"model_name":1888,"provider_name":375,"provider":1889,"is_open":37,"author_country":12,"release_date":1890,"release_month":1785,"context_length":287,"input_price_per_1m_tokens":793,"output_price_per_1m_tokens":312,"input_price":793,"output_price":312,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-vl-235b-a22b-thinking","qwen-qwen3-vl-235b-a22b-thinking","Qwen3 VL 235B A22B Thinking","Qwen Qwen3 VL 235B A22B Thinking",1758668690,{"provider_id":1892,"slug":1893,"model_name":1894,"provider_name":248,"provider":1895,"is_open":11,"author_country":12,"release_date":1896,"release_month":1785,"context_length":856,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":536,"input_price":495,"output_price":536,"benchmark_mmlu_pro":1353,"benchmark_gpqa":1877,"benchmark_aider":12,"benchmark_livecodebench":1897,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1167,"benchmark_gpqa_reasoning":1898,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1652,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":1701,"benchmark_intelligence_reasoning":1899,"benchmark_math_reasoning":749},"google:gemini-2.5-flash-lite-preview-09-2025","google-gemini-2.5-flash-lite-preview-09-2025","Gemini 2.5 Flash Lite Preview 09-2025","Google Gemini 2.5 Flash Lite Preview 09-2025",1758819686,64.1,70.9,21.6,{"provider_id":1901,"slug":1902,"model_name":1903,"provider_name":1904,"provider":1905,"is_open":11,"author_country":12,"release_date":1906,"release_month":1785,"context_length":981,"input_price_per_1m_tokens":370,"output_price_per_1m_tokens":144,"input_price":370,"output_price":144,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"relace:relace-apply-3","relace-relace-apply-3","Relace Apply 3","Relace","Relace Relace Apply 3",1758891572,{"provider_id":1908,"slug":1909,"model_name":1910,"provider_name":455,"provider":1911,"is_open":37,"author_country":12,"release_date":1912,"release_month":1785,"context_length":287,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":25,"input_price":50,"output_price":25,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"thedrummer:cydonia-24b-v4.1","thedrummer-cydonia-24b-v4.1","Cydonia 24B V4.1","Thedrummer Cydonia 24B V4.1",1758931878,{"provider_id":1914,"slug":1915,"model_name":1916,"provider_name":667,"provider":1917,"is_open":37,"author_country":12,"release_date":1918,"release_month":1785,"context_length":670,"input_price_per_1m_tokens":1626,"output_price_per_1m_tokens":1919,"input_price":1626,"output_price":1919,"benchmark_mmlu_pro":1375,"benchmark_gpqa":1608,"benchmark_aider":1793,"benchmark_livecodebench":1920,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":889,"benchmark_gpqa_reasoning":1921,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":279,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":1922,"benchmark_intelligence_reasoning":1923,"benchmark_math_reasoning":1500},"deepseek:deepseek-v3.2-exp","deepseek-deepseek-v3.2-exp","DeepSeek V3.2 Exp","Deepseek DeepSeek V3.2 Exp",1759150481,0.41,55.4,79.7,33.3,32.9,{"provider_id":1925,"slug":1926,"model_name":1927,"provider_name":138,"provider":1928,"is_open":11,"author_country":12,"release_date":1929,"release_month":1785,"context_length":792,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"benchmark_mmlu_pro":871,"benchmark_gpqa":1200,"benchmark_aider":12,"benchmark_livecodebench":623,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1930,"benchmark_gpqa_reasoning":1931,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":569,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":1932,"benchmark_intelligence_reasoning":1124,"benchmark_math_reasoning":1643},"anthropic:claude-sonnet-4.5","anthropic-claude-sonnet-4.5","Claude Sonnet 4.5","Anthropic Claude Sonnet 4.5",1759161676,87.5,83.4,38.6,{"provider_id":1934,"slug":1935,"model_name":1936,"provider_name":1580,"provider":1937,"is_open":37,"author_country":12,"release_date":1938,"release_month":1785,"context_length":1939,"input_price_per_1m_tokens":324,"output_price_per_1m_tokens":1940,"input_price":324,"output_price":1940,"benchmark_mmlu_pro":1155,"benchmark_gpqa":1941,"benchmark_aider":12,"benchmark_livecodebench":1942,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1753,"benchmark_gpqa_reasoning":1943,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1417,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":556,"benchmark_intelligence_reasoning":1944,"benchmark_math_reasoning":871},"z-ai:glm-4.6","z-ai-glm-4.6","GLM 4.6","Z-ai GLM 4.6",1759235576,204800,1.7,63.2,56.1,78,32.5,{"provider_id":1946,"slug":1947,"model_name":1948,"provider_name":9,"provider":1949,"is_open":11,"author_country":12,"release_date":1950,"release_month":1951,"context_length":1669,"input_price_per_1m_tokens":161,"output_price_per_1m_tokens":1952,"input_price":161,"output_price":1952,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5-pro","openai-gpt-5-pro","GPT-5 Pro","OpenAI GPT-5 Pro",1759776663,"2025-10",120,{"provider_id":1954,"slug":1955,"model_name":1956,"provider_name":375,"provider":1957,"is_open":37,"author_country":12,"release_date":1958,"release_month":1951,"context_length":287,"input_price_per_1m_tokens":808,"output_price_per_1m_tokens":819,"input_price":808,"output_price":819,"benchmark_mmlu_pro":1876,"benchmark_gpqa":1417,"benchmark_aider":12,"benchmark_livecodebench":300,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-vl-30b-a3b-instruct","qwen-qwen3-vl-30b-a3b-instruct","Qwen3 VL 30B A3B Instruct","Qwen Qwen3 VL 30B A3B Instruct",1759794476,{"provider_id":1960,"slug":1961,"model_name":1962,"provider_name":375,"provider":1963,"is_open":37,"author_country":12,"release_date":1964,"release_month":1951,"context_length":287,"input_price_per_1m_tokens":808,"output_price_per_1m_tokens":274,"input_price":808,"output_price":274,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-vl-30b-a3b-thinking","qwen-qwen3-vl-30b-a3b-thinking","Qwen3 VL 30B A3B Thinking","Qwen Qwen3 VL 30B A3B Thinking",1759794479,{"provider_id":1966,"slug":1967,"model_name":1968,"provider_name":248,"provider":1969,"is_open":11,"author_country":12,"release_date":1970,"release_month":1951,"context_length":115,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":220,"input_price":50,"output_price":220,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemini-2.5-flash-image","google-gemini-2.5-flash-image","Gemini 2.5 Flash Image (Nano Banana)","Google Gemini 2.5 Flash Image (Nano Banana)",1759870431,{"provider_id":1972,"slug":1973,"model_name":1974,"provider_name":1448,"provider":1975,"is_open":37,"author_country":12,"release_date":1976,"release_month":1951,"context_length":287,"input_price_per_1m_tokens":1509,"output_price_per_1m_tokens":1250,"input_price":1509,"output_price":1250,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"baidu:ernie-4.5-21b-a3b-thinking","baidu-ernie-4.5-21b-a3b-thinking","ERNIE 4.5 21B A3B Thinking","Baidu ERNIE 4.5 21B A3B Thinking",1760048887,{"provider_id":1978,"slug":1979,"model_name":1980,"provider_name":480,"provider":1981,"is_open":11,"author_country":12,"release_date":1982,"release_month":1951,"context_length":287,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":536,"input_price":495,"output_price":536,"benchmark_mmlu_pro":1983,"benchmark_gpqa":1984,"benchmark_aider":12,"benchmark_livecodebench":936,"benchmark_math_hard":771,"benchmark_aime":961,"benchmark_mmlu_pro_reasoning":1985,"benchmark_gpqa_reasoning":767,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":160,"benchmark_math_hard_reasoning":1367,"benchmark_aime_reasoning":871,"benchmark_coding_reasoning":1986,"benchmark_intelligence_reasoning":1987,"benchmark_math_reasoning":557},"nvidia:llama-3.3-nemotron-super-49b-v1.5","nvidia-llama-3.3-nemotron-super-49b-v1.5","Llama 3.3 Nemotron Super 49B V1.5","Nvidia Llama 3.3 Nemotron Super 49B V1.5",1760101395,69.2,48.1,81.4,15.2,18.7,{"provider_id":1989,"slug":1990,"model_name":1991,"provider_name":9,"provider":1992,"is_open":11,"author_country":12,"release_date":1993,"release_month":1951,"context_length":142,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":615,"input_price":78,"output_price":615,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:o4-mini-deep-research","openai-o4-mini-deep-research","o4 Mini Deep Research","OpenAI o4 Mini Deep Research",1760129642,{"provider_id":1995,"slug":1996,"model_name":1997,"provider_name":9,"provider":1998,"is_open":11,"author_country":12,"release_date":1999,"release_month":1951,"context_length":142,"input_price_per_1m_tokens":156,"output_price_per_1m_tokens":1201,"input_price":156,"output_price":1201,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:o3-deep-research","openai-o3-deep-research","o3 Deep Research","OpenAI o3 Deep Research",1760129661,{"provider_id":2001,"slug":2002,"model_name":2003,"provider_name":375,"provider":2004,"is_open":37,"author_country":12,"release_date":2005,"release_month":1951,"context_length":287,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":377,"input_price":251,"output_price":377,"benchmark_mmlu_pro":1754,"benchmark_gpqa":2006,"benchmark_aider":12,"benchmark_livecodebench":184,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-vl-8b-instruct","qwen-qwen3-vl-8b-instruct","Qwen3 VL 8B Instruct","Qwen Qwen3 VL 8B Instruct",1760463308,42.7,{"provider_id":2008,"slug":2009,"model_name":2010,"provider_name":375,"provider":2011,"is_open":11,"author_country":12,"release_date":2012,"release_month":1951,"context_length":287,"input_price_per_1m_tokens":2013,"output_price_per_1m_tokens":2014,"input_price":2013,"output_price":2014,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-vl-8b-thinking","qwen-qwen3-vl-8b-thinking","Qwen3 VL 8B Thinking","Qwen Qwen3 VL 8B Thinking",1760463746,0.117,1.365,{"provider_id":2016,"slug":2017,"model_name":2018,"provider_name":138,"provider":2019,"is_open":11,"author_country":12,"release_date":2020,"release_month":1951,"context_length":142,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":505,"input_price":61,"output_price":505,"benchmark_mmlu_pro":1398,"benchmark_gpqa":2021,"benchmark_aider":12,"benchmark_livecodebench":1012,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1322,"benchmark_gpqa_reasoning":1661,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":746,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":1111,"benchmark_intelligence_reasoning":2022,"benchmark_math_reasoning":891},"anthropic:claude-haiku-4.5","anthropic-claude-haiku-4.5","Claude Haiku 4.5","Anthropic Claude Haiku 4.5",1760547638,64.6,37.1,{"provider_id":2024,"slug":2025,"model_name":2026,"provider_name":2027,"provider":2028,"is_open":11,"author_country":12,"release_date":2029,"release_month":1951,"context_length":311,"input_price_per_1m_tokens":2030,"output_price_per_1m_tokens":86,"input_price":2030,"output_price":86,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"ibm-granite:granite-4.0-h-micro","ibm-granite-granite-4.0-h-micro","Granite 4.0 Micro","Ibm-granite","Ibm-granite Granite 4.0 Micro",1760927695,0.017,{"provider_id":2032,"slug":2033,"model_name":2034,"provider_name":2035,"provider":2036,"is_open":37,"author_country":12,"release_date":2037,"release_month":1951,"context_length":115,"input_price_per_1m_tokens":2038,"output_price_per_1m_tokens":288,"input_price":2038,"output_price":288,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"liquid:lfm-2.2-6b","liquid-lfm-2.2-6b","LiquidAI/LFM2-2.6B","Liquid","Liquid LiquidAI/LFM2-2.6B",1760970889,0.01,{"provider_id":2040,"slug":2041,"model_name":2042,"provider_name":2035,"provider":2043,"is_open":37,"author_country":12,"release_date":2044,"release_month":1951,"context_length":115,"input_price_per_1m_tokens":2038,"output_price_per_1m_tokens":288,"input_price":2038,"output_price":288,"benchmark_mmlu_pro":567,"benchmark_gpqa":2045,"benchmark_aider":12,"benchmark_livecodebench":1713,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"liquid:lfm2-8b-a1b","liquid-lfm2-8b-a1b","LiquidAI/LFM2-8B-A1B","Liquid LiquidAI/LFM2-8B-A1B",1760970984,34.4,{"provider_id":2047,"slug":2048,"model_name":2049,"provider_name":375,"provider":2050,"is_open":11,"author_country":12,"release_date":2051,"release_month":1951,"context_length":287,"input_price_per_1m_tokens":2052,"output_price_per_1m_tokens":2053,"input_price":2052,"output_price":2053,"benchmark_mmlu_pro":766,"benchmark_gpqa":1067,"benchmark_aider":12,"benchmark_livecodebench":2054,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-vl-32b-instruct","qwen-qwen3-vl-32b-instruct","Qwen3 VL 32B Instruct","Qwen Qwen3 VL 32B Instruct",1761231332,0.104,0.416,51.4,{"provider_id":2056,"slug":2057,"model_name":2058,"provider_name":696,"provider":2059,"is_open":37,"author_country":12,"release_date":2060,"release_month":1951,"context_length":2061,"input_price_per_1m_tokens":2062,"output_price_per_1m_tokens":61,"input_price":2062,"output_price":61,"benchmark_mmlu_pro":1192,"benchmark_gpqa":1255,"benchmark_aider":12,"benchmark_livecodebench":2063,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"minimax:minimax-m2","minimax-minimax-m2","MiniMax M2","Minimax MiniMax M2",1761252093,196608,0.255,82.6,{"provider_id":2065,"slug":2066,"model_name":2067,"provider_name":480,"provider":2068,"is_open":37,"author_country":12,"release_date":2069,"release_month":1951,"context_length":287,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"benchmark_mmlu_pro":329,"benchmark_gpqa":2070,"benchmark_aider":12,"benchmark_livecodebench":2071,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1551,"benchmark_gpqa_reasoning":2072,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":157,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":2073,"benchmark_intelligence_reasoning":2074,"benchmark_math_reasoning":1351},"nvidia:nemotron-nano-12b-v2-vl","nvidia-nemotron-nano-12b-v2-vl","Nemotron Nano 12B 2 VL","Nvidia Nemotron Nano 12B 2 VL",1761675565,43.9,34.5,57.2,11.8,14.9,{"provider_id":2076,"slug":2077,"model_name":2078,"provider_name":83,"provider":2079,"is_open":37,"author_country":12,"release_date":2080,"release_month":1951,"context_length":2081,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":50,"input_price":495,"output_price":50,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:voxtral-small-24b-2507","mistral-ai-voxtral-small-24b-2507","Voxtral Small 24B 2507","Mistral AI Voxtral Small 24B 2507",1761835144,32000,{"provider_id":2083,"slug":2084,"model_name":2085,"provider_name":730,"provider":2086,"is_open":11,"author_country":12,"release_date":2087,"release_month":1951,"context_length":142,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"perplexity:sonar-pro-search","perplexity-sonar-pro-search","Sonar Pro Search","Perplexity Sonar Pro Search",1761854366,{"provider_id":2089,"slug":2090,"model_name":2091,"provider_name":595,"provider":2092,"is_open":11,"author_country":12,"release_date":2093,"release_month":1951,"context_length":792,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":2094,"input_price":220,"output_price":2094,"benchmark_mmlu_pro":487,"benchmark_gpqa":2095,"benchmark_aider":12,"benchmark_livecodebench":2096,"benchmark_math_hard":2097,"benchmark_aime":2098,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"amazon:nova-premier-v1","amazon-nova-premier-v1","Nova Premier 1.0","Amazon Nova Premier 1.0",1761950332,12.5,56.9,31.7,83.9,17,{"provider_id":2100,"slug":2101,"model_name":2102,"provider_name":1522,"provider":2103,"is_open":37,"author_country":12,"release_date":2104,"release_month":2105,"context_length":287,"input_price_per_1m_tokens":2106,"output_price_per_1m_tokens":78,"input_price":2106,"output_price":78,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"moonshotai:kimi-k2-thinking","moonshotai-kimi-k2-thinking","Kimi K2 Thinking","Moonshotai Kimi K2 Thinking",1762440622,"2025-11",0.47,{"provider_id":2108,"slug":2109,"model_name":2110,"provider_name":2111,"provider":2112,"is_open":37,"author_country":12,"release_date":2113,"release_month":2105,"context_length":981,"input_price_per_1m_tokens":2114,"output_price_per_1m_tokens":2115,"input_price":2114,"output_price":2115,"benchmark_mmlu_pro":1166,"benchmark_gpqa":1876,"benchmark_aider":12,"benchmark_livecodebench":653,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"kwaipilot:kat-coder-pro","kwaipilot-kat-coder-pro","KAT-Coder-Pro V1","Kwaipilot","Kwaipilot KAT-Coder-Pro V1",1762745912,0.207,0.828,{"provider_id":2117,"slug":2118,"model_name":2119,"provider_name":9,"provider":2120,"is_open":11,"author_country":12,"release_date":2121,"release_month":2105,"context_length":1669,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":78,"input_price":143,"output_price":78,"benchmark_mmlu_pro":1192,"benchmark_gpqa":1166,"benchmark_aider":12,"benchmark_livecodebench":1375,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.1-codex-mini","openai-gpt-5.1-codex-mini","GPT-5.1-Codex-Mini","OpenAI GPT-5.1-Codex-Mini",1763057820,{"provider_id":2123,"slug":2124,"model_name":2125,"provider_name":9,"provider":2126,"is_open":11,"author_country":12,"release_date":2127,"release_month":2105,"context_length":1669,"input_price_per_1m_tokens":144,"output_price_per_1m_tokens":156,"input_price":144,"output_price":156,"benchmark_mmlu_pro":871,"benchmark_gpqa":871,"benchmark_aider":12,"benchmark_livecodebench":1366,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.1-codex","openai-gpt-5.1-codex","GPT-5.1-Codex","OpenAI GPT-5.1-Codex",1763060298,{"provider_id":2129,"slug":2130,"model_name":2131,"provider_name":9,"provider":2132,"is_open":11,"author_country":12,"release_date":2133,"release_month":2105,"context_length":129,"input_price_per_1m_tokens":107,"output_price_per_1m_tokens":505,"input_price":107,"output_price":505,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.1-chat","openai-gpt-5.1-chat","GPT-5.1 Chat","OpenAI GPT-5.1 Chat",1763060302,{"provider_id":2135,"slug":2136,"model_name":2137,"provider_name":9,"provider":2138,"is_open":11,"author_country":12,"release_date":2139,"release_month":2105,"context_length":1669,"input_price_per_1m_tokens":107,"output_price_per_1m_tokens":505,"input_price":107,"output_price":505,"benchmark_mmlu_pro":1407,"benchmark_gpqa":1233,"benchmark_aider":12,"benchmark_livecodebench":2140,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.1","openai-gpt-5.1","GPT-5.1","OpenAI GPT-5.1",1763060305,49.4,{"provider_id":2142,"slug":2143,"model_name":2144,"provider_name":2145,"provider":2146,"is_open":37,"author_country":12,"release_date":2147,"release_month":2105,"context_length":129,"input_price_per_1m_tokens":312,"output_price_per_1m_tokens":312,"input_price":312,"output_price":312,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"deepcogito:cogito-v2.1-671b","deepcogito-cogito-v2.1-671b","Cogito v2.1 671B","Deepcogito","Deepcogito Cogito v2.1 671B",1763071233,{"provider_id":2149,"slug":2150,"model_name":2151,"provider_name":248,"provider":2152,"is_open":11,"author_country":12,"release_date":2153,"release_month":2105,"context_length":856,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":558,"input_price":78,"output_price":558,"benchmark_mmlu_pro":2154,"benchmark_gpqa":2155,"benchmark_aider":12,"benchmark_livecodebench":2156,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemini-3-pro-preview","google-gemini-3-pro-preview","Gemini 3 Pro Preview","Google Gemini 3 Pro Preview",1763474668,89.8,90.8,91.7,{"provider_id":2158,"slug":2159,"model_name":2160,"provider_name":1076,"provider":2161,"is_open":11,"author_country":12,"release_date":2162,"release_month":2105,"context_length":1842,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":25,"input_price":377,"output_price":25,"benchmark_mmlu_pro":1237,"benchmark_gpqa":2163,"benchmark_aider":12,"benchmark_livecodebench":2164,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":2165,"benchmark_gpqa_reasoning":994,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1313,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":2166,"benchmark_intelligence_reasoning":1932,"benchmark_math_reasoning":973},"xai:grok-4.1-fast","xai-grok-4.1-fast","Grok 4.1 Fast","Xai Grok 4.1 Fast",1763587502,63.7,39.9,85.4,30.9,{"provider_id":2168,"slug":2169,"model_name":2170,"provider_name":248,"provider":2171,"is_open":11,"author_country":12,"release_date":2172,"release_month":2105,"context_length":181,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":558,"input_price":78,"output_price":558,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemini-3-pro-image-preview","google-gemini-3-pro-image-preview","Nano Banana Pro (Gemini 3 Pro Image Preview)","Google Nano Banana Pro (Gemini 3 Pro Image Preview)",1763653797,{"provider_id":2174,"slug":2175,"model_name":2176,"provider_name":1009,"provider":2177,"is_open":37,"author_country":12,"release_date":2178,"release_month":2105,"context_length":181,"input_price_per_1m_tokens":411,"output_price_per_1m_tokens":377,"input_price":411,"output_price":377,"benchmark_mmlu_pro":1342,"benchmark_gpqa":449,"benchmark_aider":12,"benchmark_livecodebench":712,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"allenai:olmo-3-7b-think","allenai-olmo-3-7b-think","Olmo 3 7B Think","Allenai Olmo 3 7B Think",1763758270,{"provider_id":2180,"slug":2181,"model_name":2182,"provider_name":1009,"provider":2183,"is_open":37,"author_country":12,"release_date":2184,"release_month":2105,"context_length":181,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":377,"input_price":495,"output_price":377,"benchmark_mmlu_pro":1270,"benchmark_gpqa":1201,"benchmark_aider":12,"benchmark_livecodebench":723,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"allenai:olmo-3-7b-instruct","allenai-olmo-3-7b-instruct","Olmo 3 7B Instruct","Allenai Olmo 3 7B Instruct",1763758273,{"provider_id":2186,"slug":2187,"model_name":2188,"provider_name":1009,"provider":2189,"is_open":37,"author_country":12,"release_date":2190,"release_month":2105,"context_length":181,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":25,"input_price":273,"output_price":25,"benchmark_mmlu_pro":1551,"benchmark_gpqa":1786,"benchmark_aider":12,"benchmark_livecodebench":1661,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"allenai:olmo-3-32b-think","allenai-olmo-3-32b-think","Olmo 3 32B Think","Allenai Olmo 3 32B Think",1763758276,{"provider_id":2192,"slug":2193,"model_name":2194,"provider_name":138,"provider":2195,"is_open":11,"author_country":12,"release_date":2196,"release_month":2105,"context_length":142,"input_price_per_1m_tokens":505,"output_price_per_1m_tokens":174,"input_price":505,"output_price":174,"benchmark_mmlu_pro":1070,"benchmark_gpqa":690,"benchmark_aider":12,"benchmark_livecodebench":1608,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":2197,"benchmark_gpqa_reasoning":1499,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1221,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":2198,"benchmark_intelligence_reasoning":2199,"benchmark_math_reasoning":1135},"anthropic:claude-opus-4.5","anthropic-claude-opus-4.5","Claude Opus 4.5","Anthropic Claude Opus 4.5",1764010580,89.5,47.8,49.7,{"provider_id":2201,"slug":2202,"model_name":2203,"provider_name":2204,"provider":2205,"is_open":37,"author_country":12,"release_date":2206,"release_month":2105,"context_length":287,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":700,"input_price":377,"output_price":700,"benchmark_mmlu_pro":1313,"benchmark_gpqa":2207,"benchmark_aider":12,"benchmark_livecodebench":1255,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"prime-intellect:intellect-3","prime-intellect-intellect-3","INTELLECT-3","Prime-intellect","Prime-intellect INTELLECT-3",1764212534,76.1,{"provider_id":2209,"slug":2210,"model_name":2211,"provider_name":667,"provider":2212,"is_open":37,"author_country":12,"release_date":2213,"release_month":2214,"context_length":670,"input_price_per_1m_tokens":793,"output_price_per_1m_tokens":2215,"input_price":793,"output_price":2215,"benchmark_mmlu_pro":891,"benchmark_gpqa":1709,"benchmark_aider":12,"benchmark_livecodebench":1553,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1406,"benchmark_gpqa_reasoning":1190,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":1406,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":1686,"benchmark_intelligence_reasoning":554,"benchmark_math_reasoning":2216},"deepseek:deepseek-v3.2","deepseek-deepseek-v3.2","DeepSeek V3.2","Deepseek DeepSeek V3.2",1764594642,"2025-12",0.38,92,{"provider_id":2218,"slug":2219,"model_name":2220,"provider_name":667,"provider":2221,"is_open":37,"author_country":12,"release_date":2222,"release_month":2214,"context_length":670,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":182,"input_price":536,"output_price":182,"benchmark_mmlu_pro":1253,"benchmark_gpqa":1221,"benchmark_aider":12,"benchmark_livecodebench":2223,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"deepseek:deepseek-v3.2-speciale","deepseek-deepseek-v3.2-speciale","DeepSeek V3.2 Speciale","Deepseek DeepSeek V3.2 Speciale",1764594837,89.6,{"provider_id":2225,"slug":2226,"model_name":2227,"provider_name":1284,"provider":2228,"is_open":37,"author_country":12,"release_date":2229,"release_month":2214,"context_length":287,"input_price_per_1m_tokens":2230,"output_price_per_1m_tokens":273,"input_price":2230,"output_price":273,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"arcee-ai:trinity-mini","arcee-ai-trinity-mini","Trinity Mini","Arcee AI Trinity Mini",1764601720,0.045,{"provider_id":2232,"slug":2233,"model_name":2234,"provider_name":83,"provider":2235,"is_open":37,"author_country":12,"release_date":2236,"release_month":2214,"context_length":1477,"input_price_per_1m_tokens":25,"output_price_per_1m_tokens":26,"input_price":25,"output_price":26,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-large-2512","mistral-ai-mistral-large-2512","Mistral Large 3 2512","Mistral AI Mistral Large 3 2512",1764624472,{"provider_id":2238,"slug":2239,"model_name":2240,"provider_name":83,"provider":2241,"is_open":37,"author_country":12,"release_date":2242,"release_month":2214,"context_length":287,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":495,"input_price":495,"output_price":495,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:ministral-3b-2512","mistral-ai-ministral-3b-2512","Ministral 3 3B 2512","Mistral AI Ministral 3 3B 2512",1764681560,{"provider_id":2244,"slug":2245,"model_name":2246,"provider_name":83,"provider":2247,"is_open":37,"author_country":12,"release_date":2248,"release_month":2214,"context_length":1477,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":273,"input_price":273,"output_price":273,"benchmark_mmlu_pro":2249,"benchmark_gpqa":735,"benchmark_aider":12,"benchmark_livecodebench":1203,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:ministral-8b-2512","mistral-ai-ministral-8b-2512","Ministral 3 8B 2512","Mistral AI Ministral 3 8B 2512",1764681654,64.2,{"provider_id":2251,"slug":2252,"model_name":2253,"provider_name":83,"provider":2254,"is_open":11,"author_country":12,"release_date":2255,"release_month":2214,"context_length":1477,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"benchmark_mmlu_pro":1528,"benchmark_gpqa":2072,"benchmark_aider":12,"benchmark_livecodebench":131,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:ministral-14b-2512","mistral-ai-ministral-14b-2512","Ministral 3 14B 2512","Mistral AI Ministral 3 14B 2512",1764681735,{"provider_id":2257,"slug":2258,"model_name":2259,"provider_name":595,"provider":2260,"is_open":11,"author_country":12,"release_date":2261,"release_month":2214,"context_length":792,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":220,"input_price":50,"output_price":220,"benchmark_mmlu_pro":1237,"benchmark_gpqa":2262,"benchmark_aider":12,"benchmark_livecodebench":2263,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"amazon:nova-2-lite-v1","amazon-nova-2-lite-v1","Nova 2 Lite","Amazon Nova 2 Lite",1764696672,60.3,34.6,{"provider_id":2265,"slug":2266,"model_name":2267,"provider_name":9,"provider":2268,"is_open":11,"author_country":12,"release_date":2269,"release_month":2214,"context_length":1669,"input_price_per_1m_tokens":144,"output_price_per_1m_tokens":156,"input_price":144,"output_price":156,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.1-codex-max","openai-gpt-5.1-codex-max","GPT-5.1-Codex-Max","OpenAI GPT-5.1-Codex-Max",1764878934,{"provider_id":2271,"slug":2272,"model_name":2273,"provider_name":2274,"provider":2275,"is_open":37,"author_country":12,"release_date":2276,"release_month":2214,"context_length":115,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":273,"input_price":273,"output_price":273,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"essential-ai:rnj-1-instruct","essential-ai-rnj-1-instruct","Rnj 1 Instruct","Essential AI","Essential AI Rnj 1 Instruct",1765094847,{"provider_id":2278,"slug":2279,"model_name":2280,"provider_name":2281,"provider":2282,"is_open":11,"author_country":12,"release_date":2283,"release_month":2214,"context_length":287,"input_price_per_1m_tokens":2284,"output_price_per_1m_tokens":25,"input_price":2284,"output_price":25,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"nex-agi:deepseek-v3.1-nex-n1","nex-agi-deepseek-v3.1-nex-n1","DeepSeek V3.1 Nex N1","Nex-AGI","Nex-AGI DeepSeek V3.1 Nex N1",1765204393,0.135,{"provider_id":2286,"slug":2287,"model_name":2288,"provider_name":1580,"provider":2289,"is_open":37,"author_country":12,"release_date":2290,"release_month":2214,"context_length":287,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":312,"input_price":50,"output_price":312,"benchmark_mmlu_pro":1040,"benchmark_gpqa":2291,"benchmark_aider":12,"benchmark_livecodebench":2292,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":2293,"benchmark_gpqa_reasoning":2294,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":417,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":2295,"benchmark_intelligence_reasoning":278,"benchmark_math_reasoning":994},"z-ai:glm-4.6v","z-ai-glm-4.6v","GLM 4.6V","Z-ai GLM 4.6V",1765207462,56.6,41.1,79.9,71.9,19.7,{"provider_id":2297,"slug":2298,"model_name":2299,"provider_name":1904,"provider":2300,"is_open":11,"author_country":12,"release_date":2301,"release_month":2214,"context_length":981,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":68,"input_price":61,"output_price":68,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"relace:relace-search","relace-relace-search","Relace Search","Relace Relace Search",1765213560,{"provider_id":2303,"slug":2304,"model_name":2305,"provider_name":83,"provider":2306,"is_open":37,"author_country":12,"release_date":2307,"release_month":2214,"context_length":1477,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":312,"input_price":536,"output_price":312,"benchmark_mmlu_pro":781,"benchmark_gpqa":636,"benchmark_aider":12,"benchmark_livecodebench":2308,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:devstral-2512","mistral-ai-devstral-2512","Devstral 2 2512","Mistral AI Devstral 2 2512",1765285419,44.8,{"provider_id":2310,"slug":2311,"model_name":2312,"provider_name":9,"provider":2313,"is_open":11,"author_country":12,"release_date":2314,"release_month":2214,"context_length":1669,"input_price_per_1m_tokens":2315,"output_price_per_1m_tokens":439,"input_price":2315,"output_price":439,"benchmark_mmlu_pro":1985,"benchmark_gpqa":982,"benchmark_aider":12,"benchmark_livecodebench":958,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.2","openai-gpt-5.2","GPT-5.2","OpenAI GPT-5.2",1765389775,1.75,{"provider_id":2317,"slug":2318,"model_name":2319,"provider_name":9,"provider":2320,"is_open":11,"author_country":12,"release_date":2321,"release_month":2214,"context_length":1669,"input_price_per_1m_tokens":2322,"output_price_per_1m_tokens":1190,"input_price":2322,"output_price":1190,"benchmark_mmlu_pro":2323,"benchmark_gpqa":1169,"benchmark_aider":12,"benchmark_livecodebench":1070,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.2-pro","openai-gpt-5.2-pro","GPT-5.2 Pro","OpenAI GPT-5.2 Pro",1765389780,10.5,87.4,{"provider_id":2325,"slug":2326,"model_name":2327,"provider_name":9,"provider":2328,"is_open":11,"author_country":12,"release_date":2329,"release_month":2214,"context_length":129,"input_price_per_1m_tokens":2330,"output_price_per_1m_tokens":570,"input_price":2330,"output_price":570,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.2-chat","openai-gpt-5.2-chat","GPT-5.2 Chat","OpenAI GPT-5.2 Chat",1765389783,0.875,{"provider_id":2332,"slug":2333,"model_name":2334,"provider_name":480,"provider":2335,"is_open":37,"author_country":12,"release_date":2336,"release_month":2214,"context_length":1477,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":377,"input_price":299,"output_price":377,"benchmark_mmlu_pro":29,"benchmark_gpqa":2164,"benchmark_aider":12,"benchmark_livecodebench":2337,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":2338,"benchmark_gpqa_reasoning":1356,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":2339,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":1243,"benchmark_intelligence_reasoning":1236,"benchmark_math_reasoning":918},"nvidia:nemotron-3-nano-30b-a3b","nvidia-nemotron-3-nano-30b-a3b","Nemotron 3 Nano 30B A3B","Nvidia Nemotron 3 Nano 30B A3B",1765731275,36,79.4,74.1,{"provider_id":2341,"slug":2342,"model_name":2343,"provider_name":2344,"provider":2345,"is_open":37,"author_country":12,"release_date":2346,"release_month":2214,"context_length":1477,"input_price_per_1m_tokens":404,"output_price_per_1m_tokens":744,"input_price":404,"output_price":744,"benchmark_mmlu_pro":221,"benchmark_gpqa":888,"benchmark_aider":12,"benchmark_livecodebench":722,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":1268,"benchmark_gpqa_reasoning":2347,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":2348,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":2349,"benchmark_intelligence_reasoning":2350,"benchmark_math_reasoning":2351},"xiaomi:mimo-v2-flash","xiaomi-mimo-v2-flash","MiMo-V2-Flash","Xiaomi","Xiaomi MiMo-V2-Flash",1765731308,84.6,86.8,31.8,39.2,96.3,{"provider_id":2353,"slug":2354,"model_name":2355,"provider_name":1009,"provider":2356,"is_open":37,"author_country":12,"release_date":2357,"release_month":2214,"context_length":181,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":25,"input_price":273,"output_price":25,"benchmark_mmlu_pro":1224,"benchmark_gpqa":1526,"benchmark_aider":12,"benchmark_livecodebench":1417,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"allenai:olmo-3.1-32b-think","allenai-olmo-3.1-32b-think","Olmo 3.1 32B Think","Allenai Olmo 3.1 32B Think",1765907719,{"provider_id":2359,"slug":2360,"model_name":2361,"provider_name":83,"provider":2362,"is_open":37,"author_country":12,"release_date":2363,"release_month":2214,"context_length":115,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":50,"input_price":495,"output_price":50,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"mistral-ai:mistral-small-creative","mistral-ai-mistral-small-creative","Mistral Small Creative","Mistral AI Mistral Small Creative",1765908653,{"provider_id":2365,"slug":2366,"model_name":2367,"provider_name":248,"provider":2368,"is_open":11,"author_country":12,"release_date":2369,"release_month":2214,"context_length":856,"input_price_per_1m_tokens":25,"output_price_per_1m_tokens":68,"input_price":25,"output_price":68,"benchmark_mmlu_pro":2370,"benchmark_gpqa":2371,"benchmark_aider":12,"benchmark_livecodebench":1921,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":2372,"benchmark_gpqa_reasoning":2154,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":2155,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":276,"benchmark_intelligence_reasoning":446,"benchmark_math_reasoning":655},"google:gemini-3-flash-preview","google-gemini-3-flash-preview","Gemini 3 Flash Preview","Google Gemini 3 Flash Preview",1765987078,88.2,81.2,89,{"provider_id":2374,"slug":2375,"model_name":2376,"provider_name":1580,"provider":2377,"is_open":37,"author_country":12,"release_date":2378,"release_month":2214,"context_length":2379,"input_price_per_1m_tokens":324,"output_price_per_1m_tokens":2315,"input_price":324,"output_price":2315,"benchmark_mmlu_pro":2338,"benchmark_gpqa":1121,"benchmark_aider":12,"benchmark_livecodebench":2380,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":2381,"benchmark_gpqa_reasoning":1156,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":2382,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":2383,"benchmark_intelligence_reasoning":2384,"benchmark_math_reasoning":2385},"z-ai:glm-4.7","z-ai-glm-4.7","GLM 4.7","Z-ai GLM 4.7",1766378014,202752,56.2,85.6,89.4,36.3,42.1,95,{"provider_id":2387,"slug":2388,"model_name":2389,"provider_name":696,"provider":2390,"is_open":37,"author_country":12,"release_date":2391,"release_month":2214,"context_length":2061,"input_price_per_1m_tokens":1626,"output_price_per_1m_tokens":2392,"input_price":1626,"output_price":2392,"benchmark_mmlu_pro":1930,"benchmark_gpqa":2393,"benchmark_aider":12,"benchmark_livecodebench":690,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"minimax:minimax-m2.1","minimax-minimax-m2.1","MiniMax M2.1","Minimax MiniMax M2.1",1766454997,0.95,83,{"provider_id":2395,"slug":2396,"model_name":2397,"provider_name":2398,"provider":2399,"is_open":11,"author_country":12,"release_date":2400,"release_month":2214,"context_length":1477,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":78,"input_price":143,"output_price":78,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"bytedance-seed:seed-1.6","bytedance-seed-seed-1.6","Seed 1.6","Bytedance-seed","Bytedance-seed Seed 1.6",1766504997,{"provider_id":2402,"slug":2403,"model_name":2404,"provider_name":2398,"provider":2405,"is_open":11,"author_country":12,"release_date":2406,"release_month":2214,"context_length":1477,"input_price_per_1m_tokens":901,"output_price_per_1m_tokens":50,"input_price":901,"output_price":50,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"bytedance-seed:seed-1.6-flash","bytedance-seed-seed-1.6-flash","Seed 1.6 Flash","Bytedance-seed Seed 1.6 Flash",1766505011,{"provider_id":2408,"slug":2409,"model_name":2410,"provider_name":1009,"provider":2411,"is_open":37,"author_country":12,"release_date":2412,"release_month":2413,"context_length":181,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":274,"input_price":377,"output_price":274,"benchmark_mmlu_pro":12,"benchmark_gpqa":2414,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"allenai:olmo-3.1-32b-instruct","allenai-olmo-3.1-32b-instruct","Olmo 3.1 32B Instruct","Allenai Olmo 3.1 32B Instruct",1767728554,"2026-01",53.9,{"provider_id":2416,"slug":2417,"model_name":2418,"provider_name":1009,"provider":2419,"is_open":37,"author_country":12,"release_date":2420,"release_month":2413,"context_length":2421,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"benchmark_mmlu_pro":12,"benchmark_gpqa":2422,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"allenai:molmo-2-8b","allenai-molmo-2-8b","Molmo 2 8B","Allenai Molmo 2 8B",1767996672,36864,42.5,{"provider_id":2424,"slug":2425,"model_name":2426,"provider_name":9,"provider":2427,"is_open":11,"author_country":12,"release_date":2428,"release_month":2413,"context_length":1669,"input_price_per_1m_tokens":2315,"output_price_per_1m_tokens":439,"input_price":2315,"output_price":439,"benchmark_mmlu_pro":12,"benchmark_gpqa":2429,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.2-codex","openai-gpt-5.2-codex","GPT-5.2-Codex","OpenAI GPT-5.2-Codex",1768409315,89.9,{"provider_id":2431,"slug":2432,"model_name":2433,"provider_name":1580,"provider":2434,"is_open":37,"author_country":12,"release_date":2435,"release_month":2413,"context_length":2379,"input_price_per_1m_tokens":41,"output_price_per_1m_tokens":536,"input_price":41,"output_price":536,"benchmark_mmlu_pro":12,"benchmark_gpqa":1234,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":2436,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":301,"benchmark_intelligence_reasoning":2437,"benchmark_math_reasoning":12},"z-ai:glm-4.7-flash","z-ai-glm-4.7-flash","GLM-4.7-Flash","Z-ai GLM-4.7-Flash",1768833913,58.1,30.1,{"provider_id":2439,"slug":2440,"model_name":2441,"provider_name":2442,"provider":2443,"is_open":11,"author_country":12,"release_date":2444,"release_month":2413,"context_length":2445,"input_price_per_1m_tokens":274,"output_price_per_1m_tokens":565,"input_price":274,"output_price":565,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"writer:palmyra-x5","writer-palmyra-x5","Palmyra X5","Writer","Writer Palmyra X5",1769003823,1040000,{"provider_id":2447,"slug":2448,"model_name":2449,"provider_name":696,"provider":2450,"is_open":11,"author_country":12,"release_date":2451,"release_month":2413,"context_length":181,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":182,"input_price":50,"output_price":182,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"minimax:minimax-m2-her","minimax-minimax-m2-her","MiniMax M2 Her","Minimax MiniMax M2 Her",1769177239,{"provider_id":2453,"slug":2454,"model_name":2455,"provider_name":1522,"provider":2456,"is_open":37,"author_country":12,"release_date":2457,"release_month":2413,"context_length":1477,"input_price_per_1m_tokens":2458,"output_price_per_1m_tokens":2459,"input_price":2458,"output_price":2459,"benchmark_mmlu_pro":12,"benchmark_gpqa":279,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":2460,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":2461,"benchmark_intelligence_reasoning":2462,"benchmark_math_reasoning":12},"moonshotai:kimi-k2.5","moonshotai-kimi-k2.5","Kimi K2.5","Moonshotai Kimi K2.5",1769487076,0.3827,1.72,87.9,39.5,46.8,{"provider_id":2464,"slug":2465,"model_name":2466,"provider_name":2467,"provider":2468,"is_open":37,"author_country":12,"release_date":2469,"release_month":2413,"context_length":981,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":50,"input_price":495,"output_price":50,"benchmark_mmlu_pro":12,"benchmark_gpqa":1376,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"stepfun-ai:step-3.5-flash","stepfun-step-3.5-flash","Step 3.5 Flash","Stepfun-ai","Stepfun-ai Step 3.5 Flash",1769728337,{"provider_id":2471,"slug":2472,"model_name":2473,"provider_name":375,"provider":2474,"is_open":37,"author_country":12,"release_date":2475,"release_month":2476,"context_length":1477,"input_price_per_1m_tokens":411,"output_price_per_1m_tokens":60,"input_price":411,"output_price":60,"benchmark_mmlu_pro":12,"benchmark_gpqa":160,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3-coder-next","qwen-qwen3-coder-next","Qwen3 Coder Next","Qwen Qwen3 Coder Next",1770164101,"2026-02",{"provider_id":2478,"slug":2479,"model_name":2480,"provider_name":138,"provider":2481,"is_open":11,"author_country":12,"release_date":2482,"release_month":2476,"context_length":792,"input_price_per_1m_tokens":505,"output_price_per_1m_tokens":174,"input_price":505,"output_price":174,"benchmark_mmlu_pro":12,"benchmark_gpqa":1190,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":2223,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":1984,"benchmark_intelligence_reasoning":2483,"benchmark_math_reasoning":12},"anthropic:claude-opus-4.6","anthropic-claude-opus-4.6","Claude Opus 4.6","Anthropic Claude Opus 4.6",1770219050,53,{"provider_id":2485,"slug":2486,"model_name":2487,"provider_name":375,"provider":2488,"is_open":11,"author_country":12,"release_date":2489,"release_month":2476,"context_length":1477,"input_price_per_1m_tokens":794,"output_price_per_1m_tokens":1875,"input_price":794,"output_price":1875,"benchmark_mmlu_pro":1525,"benchmark_gpqa":1452,"benchmark_aider":12,"benchmark_livecodebench":903,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":1685,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":315,"benchmark_intelligence_reasoning":2164,"benchmark_math_reasoning":12},"qwen:qwen3-max-thinking","qwen-qwen3-max-thinking","Qwen3 Max Thinking","Qwen Qwen3 Max Thinking",1770671901,{"provider_id":2491,"slug":2492,"model_name":2493,"provider_name":1580,"provider":2494,"is_open":37,"author_country":12,"release_date":2495,"release_month":2476,"context_length":2379,"input_price_per_1m_tokens":2496,"output_price_per_1m_tokens":363,"input_price":2496,"output_price":363,"benchmark_mmlu_pro":12,"benchmark_gpqa":1132,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":1192,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":2497,"benchmark_intelligence_reasoning":635,"benchmark_math_reasoning":12},"z-ai:glm-5","z-ai-glm-5","GLM 5","Z-ai GLM 5",1770829182,0.72,44.2,{"provider_id":2499,"slug":2500,"model_name":2501,"provider_name":696,"provider":2502,"is_open":37,"author_country":12,"release_date":2503,"release_month":2476,"context_length":2061,"input_price_per_1m_tokens":2504,"output_price_per_1m_tokens":2392,"input_price":2504,"output_price":2392,"benchmark_mmlu_pro":12,"benchmark_gpqa":1112,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"minimax:minimax-m2.5","minimax-minimax-m2.5","MiniMax M2.5","Minimax MiniMax M2.5",1770908502,0.118,{"provider_id":2506,"slug":2507,"model_name":2508,"provider_name":375,"provider":2509,"is_open":37,"author_country":12,"release_date":2510,"release_month":2476,"context_length":1477,"input_price_per_1m_tokens":324,"output_price_per_1m_tokens":312,"input_price":324,"output_price":312,"benchmark_mmlu_pro":12,"benchmark_gpqa":1685,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3.5-397b-a17b","qwen-qwen3.5-397b-a17b","Qwen3.5 397B A17B","Qwen Qwen3.5 397B A17B",1771223018,{"provider_id":2512,"slug":2513,"model_name":2514,"provider_name":375,"provider":2515,"is_open":11,"author_country":12,"release_date":2516,"release_month":2476,"context_length":792,"input_price_per_1m_tokens":793,"output_price_per_1m_tokens":2517,"input_price":793,"output_price":2517,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3.5-plus","qwen-qwen3.5-plus","Qwen3.5 Plus","Qwen Qwen3.5 Plus",1771229416,1.56,{"provider_id":2519,"slug":2520,"model_name":2521,"provider_name":138,"provider":2522,"is_open":11,"author_country":12,"release_date":2523,"release_month":2476,"context_length":792,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"benchmark_mmlu_pro":12,"benchmark_gpqa":1921,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"anthropic:claude-sonnet-4.6","anthropic-claude-sonnet-4.6","Claude Sonnet 4.6","Anthropic Claude Sonnet 4.6",1771342990,{"provider_id":2525,"slug":2526,"model_name":2527,"provider_name":248,"provider":2528,"is_open":11,"author_country":12,"release_date":2529,"release_month":2476,"context_length":856,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":558,"input_price":78,"output_price":558,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemini-3.1-pro-preview","google-gemini-3.1-pro-preview","Gemini 3.1 Pro Preview","Google Gemini 3.1 Pro Preview",1771509627,{"provider_id":2531,"slug":2532,"model_name":2533,"provider_name":825,"provider":2534,"is_open":11,"author_country":12,"release_date":2535,"release_month":2476,"context_length":287,"input_price_per_1m_tokens":524,"output_price_per_1m_tokens":828,"input_price":524,"output_price":828,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"aion-labs:aion-2.0","aion-labs-aion-2.0","Aion 2.0","Aion Labs Aion 2.0",1771881306,{"provider_id":2537,"slug":2538,"model_name":2539,"provider_name":9,"provider":2540,"is_open":11,"author_country":12,"release_date":2541,"release_month":2476,"context_length":1669,"input_price_per_1m_tokens":2315,"output_price_per_1m_tokens":439,"input_price":2315,"output_price":439,"benchmark_mmlu_pro":12,"benchmark_gpqa":2542,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.3-codex","openai-gpt-5.3-codex","GPT-5.3 Codex","OpenAI GPT-5.3 Codex",1771959164,91.5,{"provider_id":2544,"slug":2545,"model_name":2546,"provider_name":248,"provider":2547,"is_open":11,"author_country":12,"release_date":2548,"release_month":2476,"context_length":856,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":558,"input_price":78,"output_price":558,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemini-3.1-pro-preview-customtools","google-gemini-3.1-pro-preview-customtools","Gemini 3.1 Pro Preview Custom Tools","Google Gemini 3.1 Pro Preview Custom Tools",1772045923,{"provider_id":2550,"slug":2551,"model_name":2552,"provider_name":2035,"provider":2553,"is_open":37,"author_country":12,"release_date":2554,"release_month":2476,"context_length":115,"input_price_per_1m_tokens":207,"output_price_per_1m_tokens":411,"input_price":207,"output_price":411,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"liquid:lfm-2-24b-a2b","liquid-lfm-2-24b-a2b","LFM2-24B-A2B","Liquid LFM2-24B-A2B",1772048711,{"provider_id":2556,"slug":2557,"model_name":2558,"provider_name":375,"provider":2559,"is_open":11,"author_country":12,"release_date":2560,"release_month":2476,"context_length":792,"input_price_per_1m_tokens":687,"output_price_per_1m_tokens":793,"input_price":687,"output_price":793,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3.5-flash","qwen-qwen3.5-flash","Qwen3.5-Flash","Qwen Qwen3.5-Flash",1772053776,{"provider_id":2562,"slug":2563,"model_name":2564,"provider_name":375,"provider":2565,"is_open":37,"author_country":12,"release_date":2566,"release_month":2476,"context_length":1477,"input_price_per_1m_tokens":793,"output_price_per_1m_tokens":820,"input_price":793,"output_price":820,"benchmark_mmlu_pro":12,"benchmark_gpqa":1165,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3.5-122b-a10b","qwen-qwen3.5-122b-a10b","Qwen3.5-122B-A10B","Qwen Qwen3.5-122B-A10B",1772053789,{"provider_id":2568,"slug":2569,"model_name":2570,"provider_name":375,"provider":2571,"is_open":37,"author_country":12,"release_date":2572,"release_month":2476,"context_length":1477,"input_price_per_1m_tokens":1827,"output_price_per_1m_tokens":312,"input_price":1827,"output_price":312,"benchmark_mmlu_pro":12,"benchmark_gpqa":513,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3.5-27b","qwen-qwen3.5-27b","Qwen3.5-27B","Qwen Qwen3.5-27B",1772053810,{"provider_id":2574,"slug":2575,"model_name":2576,"provider_name":375,"provider":2577,"is_open":37,"author_country":12,"release_date":2578,"release_month":2476,"context_length":1477,"input_price_per_1m_tokens":2579,"output_price_per_1m_tokens":312,"input_price":2579,"output_price":312,"benchmark_mmlu_pro":12,"benchmark_gpqa":984,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3.5-35b-a3b","qwen-qwen3.5-35b-a3b","Qwen3.5-35B-A3B","Qwen Qwen3.5-35B-A3B",1772053822,0.1625,{"provider_id":2581,"slug":2582,"model_name":2583,"provider_name":2398,"provider":2584,"is_open":11,"author_country":12,"release_date":2585,"release_month":2476,"context_length":1477,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":536,"input_price":495,"output_price":536,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"bytedance-seed:seed-2.0-mini","bytedance-seed-seed-2.0-mini","Seed 2.0 Mini","Bytedance-seed Seed 2.0 Mini",1772131107,{"provider_id":2587,"slug":2588,"model_name":2589,"provider_name":248,"provider":2590,"is_open":11,"author_country":12,"release_date":2591,"release_month":2592,"context_length":856,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":26,"input_price":143,"output_price":26,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"google:gemini-3.1-flash-lite-preview","google-gemini-3.1-flash-lite-preview","Gemini 3.1 Flash Lite Preview","Google Gemini 3.1 Flash Lite Preview",1772512673,"2026-03",{"provider_id":2594,"slug":2595,"model_name":2596,"provider_name":9,"provider":2597,"is_open":11,"author_country":12,"release_date":2598,"release_month":2592,"context_length":129,"input_price_per_1m_tokens":2315,"output_price_per_1m_tokens":439,"input_price":2315,"output_price":439,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.3-chat","openai-gpt-5.3-chat","GPT-5.3 Chat","OpenAI GPT-5.3 Chat",1772564061,{"provider_id":2600,"slug":2601,"model_name":2602,"provider_name":1277,"provider":2603,"is_open":37,"author_country":12,"release_date":2604,"release_month":2592,"context_length":129,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":60,"input_price":143,"output_price":60,"benchmark_mmlu_pro":12,"benchmark_gpqa":771,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"inception:mercury-2","inception-mercury-2","Mercury 2","Inception Mercury 2",1772636275,{"provider_id":2606,"slug":2607,"model_name":2608,"provider_name":9,"provider":2609,"is_open":11,"author_country":12,"release_date":2610,"release_month":2592,"context_length":2611,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":161,"input_price":220,"output_price":161,"benchmark_mmlu_pro":12,"benchmark_gpqa":767,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.4","openai-gpt-5.4","GPT-5.4","OpenAI GPT-5.4",1772734352,1050000,{"provider_id":2613,"slug":2614,"model_name":2615,"provider_name":9,"provider":2616,"is_open":11,"author_country":12,"release_date":2617,"release_month":2592,"context_length":2611,"input_price_per_1m_tokens":16,"output_price_per_1m_tokens":2618,"input_price":16,"output_price":2618,"benchmark_mmlu_pro":12,"benchmark_gpqa":12,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"openai:gpt-5.4-pro","openai-gpt-5.4-pro","GPT-5.4 Pro","OpenAI GPT-5.4 Pro",1772734366,180,{"provider_id":2620,"slug":2621,"model_name":2622,"provider_name":375,"provider":2623,"is_open":37,"author_country":12,"release_date":2624,"release_month":2592,"context_length":1477,"input_price_per_1m_tokens":208,"output_price_per_1m_tokens":273,"input_price":208,"output_price":273,"benchmark_mmlu_pro":12,"benchmark_gpqa":604,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"qwen:qwen3.5-9b","qwen-qwen3.5-9b","Qwen3.5 9B","Qwen Qwen3.5 9B",1773152396,{"provider_id":2626,"slug":2627,"model_name":2628,"provider_name":2398,"provider":2629,"is_open":11,"author_country":12,"release_date":2630,"release_month":2592,"context_length":1477,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":78,"input_price":143,"output_price":78,"benchmark_mmlu_pro":12,"benchmark_gpqa":888,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"bytedance-seed:seed-2.0-lite","bytedance-seed-seed-2.0-lite","Seed 2.0 Lite","Bytedance-seed Seed 2.0 Lite",1773157231,{"provider_id":2632,"slug":2633,"model_name":2634,"provider_name":1580,"provider":2635,"is_open":11,"author_country":12,"release_date":2636,"release_month":2592,"context_length":2379,"input_price_per_1m_tokens":182,"output_price_per_1m_tokens":69,"input_price":182,"output_price":69,"benchmark_mmlu_pro":12,"benchmark_gpqa":1844,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"z-ai:glm-5-turbo","z-ai-glm-5-turbo","GLM-5 Turbo","Z-ai GLM-5 Turbo",1773583573,{"provider_id":2638,"slug":2639,"model_name":2640,"provider_name":696,"provider":2641,"is_open":11,"author_country":12,"release_date":2642,"release_month":2592,"context_length":1939,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":182,"input_price":50,"output_price":182,"benchmark_mmlu_pro":12,"benchmark_gpqa":2323,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"minimax:minimax-m2.7","minimax-minimax-m2.7","MiniMax M2.7","Minimax MiniMax M2.7",1773836697,{"provider_id":2644,"slug":2645,"model_name":2646,"provider_name":2344,"provider":2647,"is_open":11,"author_country":12,"release_date":2648,"release_month":2592,"context_length":1477,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":78,"input_price":536,"output_price":78,"benchmark_mmlu_pro":12,"benchmark_gpqa":1187,"benchmark_aider":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_aime":12,"benchmark_mmlu_pro_reasoning":12,"benchmark_gpqa_reasoning":12,"benchmark_aider_reasoning":12,"benchmark_livecodebench_reasoning":12,"benchmark_math_hard_reasoning":12,"benchmark_aime_reasoning":12,"benchmark_coding_reasoning":12,"benchmark_intelligence_reasoning":12,"benchmark_math_reasoning":12},"xiaomi:mimo-v2-omni","xiaomi-mimo-v2-omni","MiMo v2 Omni","Xiaomi MiMo v2 Omni",1773863703,[2650,2658,2662,2670,2678,2686,2696,2703,2712,2723,2736,2746,2769,2781,2794,2799,2813,2829,2853,2864,2870,2877,2889,2901,2909,2929,2937,2959,2966,2978,3006,3031,3047,3054,3062,3083,3112,3137,3144,3152,3161,3169,3193,3200,3207,3230,3240,3246,3276,3288,3294,3316,3322,3328,3331,3352,3359,3382,3390,3397,3405,3416,3420,3426,3431,3435,3455,3476,3491,3500,3508,3520,3542,3547,3556,3567,3579,3591,3598,3619,3626,3635,3642,3652,3660,3680,3685,3694,3698,3703,3708,3715,3733,3752,3768,3778,3793,3798,3815,3820,3835,3838,3848,3854,3866,3881,3886,3900,3921,3942,3955,3977,3985,3999,4006,4023,4036,4042,4055,4063,4076,4088,4096,4103,4112,4117,4128,4142,4149,4157,4164,4170,4184,4201,4208,4214,4223,4234,4244,4249,4263,4272,4275,4287,4293,4305,4311,4317,4325,4332,4337,4344,4349,4358,4364,4371,4375,4382,4391,4398,4407,4410,4419,4424,4434,4444,4459,4468,4481,4487,4492,4501,4508,4513,4524,4530,4535,4541,4549,4558,4564,4572,4574,4582,4591,4597,4608,4614,4624,4635,4642,4645,4650,4653,4661,4666,4675,4683,4688,4692,4696,4702,4708,4715,4722,4728,4734,4744,4750,4762,4769,4777,4782,4787,4793,4805,4811,4820,4825,4833,4840,4844,4851,4862,4868,4879,4884,4891,4895,4906,4912,4918,4923,4936,4944,4955,4965,4970,4975,4984,4989,4994,4997,5005,5010,5021,5028,5038,5043,5053,5060,5067,5074,5079,5083,5089,5094,5100,5104,5111],{"aa_id":2651,"ppt_model_id":2652,"slug":7,"model_name":8,"provider_name":9,"name":8,"provider":9,"aa_name":8,"is_open":11,"author_country":2653,"release_date":13,"release_month":14,"context_length":15,"inference_mode":2654,"input_price_per_1m_tokens":16,"output_price_per_1m_tokens":17,"input_price":16,"output_price":17,"tokens_per_second":2655,"time_to_first_token":2656,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":18,"benchmark_intelligence":2657,"benchmark_coding":1225},"ce50ec23-b95c-405e-917c-24569e6556f5","f4a855d0-ec6e-46c5-8b7f-6dcb29f76440","us","standard",31.332,0.746,12.8,{"aa_id":2659,"ppt_model_id":2660,"slug":21,"model_name":22,"provider_name":9,"name":22,"provider":9,"aa_name":22,"is_open":11,"author_country":2653,"release_date":13,"release_month":14,"context_length":24,"inference_mode":2654,"input_price_per_1m_tokens":25,"output_price_per_1m_tokens":26,"input_price":25,"output_price":26,"tokens_per_second":2661,"time_to_first_token":1364,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":28,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":30,"benchmark_mmlu_pro":27,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":29,"benchmark_intelligence":1241,"benchmark_coding":605},"fd87af35-0971-4e0d-9dfb-dc7fe6ddb96d","0a0447b6-7b51-43c9-a368-e7321099e0be",86.62,{"aa_id":2663,"ppt_model_id":2664,"slug":110,"model_name":111,"provider_name":2665,"name":111,"provider":2665,"aa_name":111,"is_open":37,"author_country":2666,"release_date":113,"release_month":114,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":116,"output_price_per_1m_tokens":117,"input_price":116,"output_price":117,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":2667,"benchmark_aime_25":12,"benchmark_gpqa":119,"benchmark_hle":545,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":2668,"benchmark_math_hard":121,"benchmark_mmlu_pro":118,"benchmark_scicode":2669,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":305},"ecc55009-a2db-4b92-a70a-bd21cb0944ed","9658aa51-f549-4534-8c33-23f671c58158","Mistral","fr",0,6.6000000000000005,2.8000000000000003,{"aa_id":2671,"ppt_model_id":2672,"slug":124,"model_name":125,"provider_name":2665,"name":125,"provider":2665,"aa_name":2673,"is_open":37,"author_country":2666,"release_date":127,"release_month":128,"context_length":129,"inference_mode":2654,"input_price_per_1m_tokens":25,"output_price_per_1m_tokens":26,"input_price":25,"output_price":26,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":2667,"benchmark_aime_25":12,"benchmark_gpqa":2674,"benchmark_hle":2675,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":132,"benchmark_math_hard":133,"benchmark_mmlu_pro":130,"benchmark_scicode":2676,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2677},"f5b3ffde-6cd0-4baa-90ff-20fd53312ac8","44122d0b-2e39-4efd-9d92-5c9feda6492e","Mistral Large (Feb '24)",35.099999999999994,3.4000000000000004,20.8,9.9,{"aa_id":2679,"ppt_model_id":2680,"slug":136,"model_name":137,"provider_name":138,"name":137,"provider":138,"aa_name":137,"is_open":11,"author_country":2653,"release_date":140,"release_month":141,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":144,"input_price":143,"output_price":144,"tokens_per_second":2681,"time_to_first_token":2682,"benchmark_aime":61,"benchmark_aime_25":12,"benchmark_gpqa":145,"benchmark_hle":1875,"benchmark_ifbench":265,"benchmark_lcr":2683,"benchmark_livecodebench":147,"benchmark_math_hard":148,"benchmark_mmlu_pro":12,"benchmark_scicode":1755,"benchmark_tau2":2684,"benchmark_terminalbench":524,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":146,"benchmark_intelligence":2685,"benchmark_coding":429},"cb1d9cf3-cd59-4bee-a6c7-112a0b1854e0","074ea461-fc74-44bc-ab40-9acb51197c5b",134.777,0.436,21,21.099999999999998,12.3,{"aa_id":2687,"ppt_model_id":2688,"slug":151,"model_name":152,"provider_name":9,"name":152,"provider":9,"aa_name":152,"is_open":11,"author_country":2653,"release_date":154,"release_month":155,"context_length":129,"inference_mode":2654,"input_price_per_1m_tokens":156,"output_price_per_1m_tokens":16,"input_price":156,"output_price":16,"tokens_per_second":2689,"time_to_first_token":2690,"benchmark_aime":161,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":2691,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":2692,"benchmark_math_hard":160,"benchmark_mmlu_pro":2693,"benchmark_scicode":2694,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":158,"benchmark_intelligence":961,"benchmark_coding":2695},"deb5c9a0-51b9-480b-bff9-3a7617a38d57","2db933de-4db3-41eb-877c-409cf837fc80",29.608,0.983,3.3000000000000003,29.099999999999998,69.39999999999999,31.900000000000002,21.5,{"aa_id":2697,"ppt_model_id":2698,"slug":177,"model_name":178,"provider_name":2665,"name":178,"provider":2665,"aa_name":178,"is_open":37,"author_country":2666,"release_date":180,"release_month":155,"context_length":181,"inference_mode":2654,"input_price_per_1m_tokens":182,"output_price_per_1m_tokens":182,"input_price":182,"output_price":182,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":2667,"benchmark_aime_25":12,"benchmark_gpqa":184,"benchmark_hle":2699,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":2700,"benchmark_math_hard":2701,"benchmark_mmlu_pro":183,"benchmark_scicode":361,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2702},"524a76ea-bebc-43f4-ba4a-ec7b0820ffe6","d4807f66-8fb5-46f7-8ffe-ec4ab099aa82",4.1000000000000005,14.799999999999999,54.50000000000001,9.8,{"aa_id":2704,"ppt_model_id":2705,"slug":189,"model_name":190,"provider_name":2706,"name":190,"provider":2706,"aa_name":2707,"is_open":37,"author_country":2653,"release_date":193,"release_month":155,"context_length":194,"inference_mode":2654,"input_price_per_1m_tokens":195,"output_price_per_1m_tokens":196,"input_price":195,"output_price":196,"tokens_per_second":2708,"time_to_first_token":2709,"benchmark_aime":2667,"benchmark_aime_25":12,"benchmark_gpqa":198,"benchmark_hle":2710,"benchmark_ifbench":2022,"benchmark_lcr":2667,"benchmark_livecodebench":200,"benchmark_math_hard":201,"benchmark_mmlu_pro":197,"benchmark_scicode":2711,"benchmark_tau2":2667,"benchmark_terminalbench":524,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":199,"benchmark_intelligence":1110,"benchmark_coding":1014},"6a22ce42-7158-4942-a612-3299d1fa0e18","3bd4cf82-7445-48aa-888d-6fe424d981b0","Meta","Llama 3 Instruct 70B",40.514,0.425,4.3999999999999995,18.9,{"aa_id":2713,"ppt_model_id":2714,"slug":204,"model_name":205,"provider_name":2706,"name":205,"provider":2706,"aa_name":2715,"is_open":37,"author_country":2653,"release_date":193,"release_month":155,"context_length":194,"inference_mode":2654,"input_price_per_1m_tokens":207,"output_price_per_1m_tokens":208,"input_price":207,"output_price":208,"tokens_per_second":2716,"time_to_first_token":2717,"benchmark_aime":2667,"benchmark_aime_25":12,"benchmark_gpqa":2718,"benchmark_hle":2719,"benchmark_ifbench":2720,"benchmark_lcr":2667,"benchmark_livecodebench":211,"benchmark_math_hard":212,"benchmark_mmlu_pro":209,"benchmark_scicode":2721,"benchmark_tau2":2667,"benchmark_terminalbench":2667,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2722,"benchmark_coding":69},"2276bc3d-f616-432a-8136-ff8caeeaa3ae","95ec6caa-ca3b-4552-a926-5654f189038d","Llama 3 Instruct 8B",82.035,0.379,29.599999999999998,5.1,24.6,11.899999999999999,6.4,{"aa_id":2724,"ppt_model_id":2725,"slug":215,"model_name":216,"provider_name":9,"name":216,"provider":9,"aa_name":2726,"is_open":11,"author_country":2653,"release_date":218,"release_month":219,"context_length":129,"inference_mode":2654,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":156,"input_price":220,"output_price":156,"tokens_per_second":2727,"time_to_first_token":2728,"benchmark_aime":2729,"benchmark_aime_25":12,"benchmark_gpqa":2730,"benchmark_hle":2731,"benchmark_ifbench":2337,"benchmark_lcr":2732,"benchmark_livecodebench":2096,"benchmark_math_hard":721,"benchmark_mmlu_pro":12,"benchmark_scicode":2733,"benchmark_tau2":2734,"benchmark_terminalbench":427,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":2735,"benchmark_aider":221},"0cd0d474-23a6-4305-8c0d-d5876ed25214","5d7b5410-39c9-4c54-8749-c8fb42798da4","GPT-4o (Aug '24)",86.069,0.541,11.700000000000001,52.1,2.9000000000000004,35,33.1,28.9,37.4966,{"aa_id":2737,"ppt_model_id":2738,"slug":269,"model_name":270,"provider_name":9,"name":270,"provider":9,"aa_name":2739,"is_open":11,"author_country":2653,"release_date":272,"release_month":261,"context_length":129,"inference_mode":2654,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":274,"input_price":273,"output_price":274,"tokens_per_second":2740,"time_to_first_token":2741,"benchmark_aime":2729,"benchmark_aime_25":2742,"benchmark_gpqa":276,"benchmark_hle":69,"benchmark_ifbench":2743,"benchmark_lcr":12,"benchmark_livecodebench":2744,"benchmark_math_hard":279,"benchmark_mmlu_pro":275,"benchmark_scicode":2745,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2742,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":277,"benchmark_intelligence":1144},"bb63c42f-c412-4a45-8e28-df48b4c36eb9","00ad02db-6114-4289-a68e-f49b650d98ca","GPT-4o mini",50.165,0.501,14.7,31,23.400000000000002,22.900000000000002,{"aa_id":2747,"ppt_model_id":2748,"slug":308,"model_name":309,"provider_name":2706,"name":309,"provider":2706,"aa_name":2749,"is_open":37,"author_country":2653,"release_date":297,"release_month":261,"context_length":311,"inference_mode":2654,"input_price_per_1m_tokens":312,"output_price_per_1m_tokens":312,"input_price":312,"output_price":312,"tokens_per_second":2750,"time_to_first_token":2751,"benchmark_aime":317,"benchmark_aime_25":68,"benchmark_gpqa":130,"benchmark_hle":2752,"benchmark_ifbench":1071,"benchmark_lcr":1236,"benchmark_livecodebench":315,"benchmark_math_hard":316,"benchmark_mmlu_pro":313,"benchmark_scicode":121,"benchmark_tau2":1243,"benchmark_terminalbench":2753,"benchmark_accountingaudit":1201,"benchmark_agieval_zh":12,"benchmark_agieval_en":2754,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":2755,"benchmark_bbh":2756,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":2757,"benchmark_gaia":12,"benchmark_gsm8k":2758,"benchmark_humaneval":2759,"benchmark_ifeval":12,"benchmark_knights_and_knaves":2760,"benchmark_math":68,"benchmark_mbppplus":2761,"benchmark_medqa":2762,"benchmark_mmlu":2763,"benchmark_mmmu":2764,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":2765,"benchmark_swe_bench_lite":12,"benchmark_wmdp":2766,"benchmark_wmt":2767,"benchmark_aider":314,"benchmark_intelligence":1191,"benchmark_coding":2768},"bb5ebe1e-add9-4e48-9d20-6fc1ead1e3ec","9887ca4f-3eb4-470c-970a-96c578a34db3","Llama 3.1 Instruct 405B",30.896,0.468,4.2,6.800000000000001,63.6685,19.0708,89.0084,58.2,90.5882,67.0732,33.8571,36.7725,82.8751,37.0816,45.2381,33.3333,67.7476,38.0491,14.5,{"aa_id":2770,"ppt_model_id":2771,"slug":320,"model_name":321,"provider_name":2706,"name":321,"provider":2706,"aa_name":2772,"is_open":37,"author_country":2653,"release_date":297,"release_month":261,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":323,"output_price_per_1m_tokens":324,"input_price":323,"output_price":324,"tokens_per_second":2773,"time_to_first_token":2774,"benchmark_aime":2775,"benchmark_aime_25":69,"benchmark_gpqa":326,"benchmark_hle":2776,"benchmark_ifbench":2045,"benchmark_lcr":1004,"benchmark_livecodebench":2777,"benchmark_math_hard":329,"benchmark_mmlu_pro":2778,"benchmark_scicode":2779,"benchmark_tau2":1986,"benchmark_terminalbench":68,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":2780,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":69,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":327,"benchmark_intelligence":2094,"benchmark_coding":1712},"2691f7b8-06e7-47be-b786-3d2680d963ea","ae9825bc-800a-47f8-9aae-193a4991685c","Llama 3.1 Instruct 70B",30.784,0.535,17.299999999999997,4.6,23.200000000000003,67.60000000000001,26.700000000000003,14.0265,{"aa_id":2782,"ppt_model_id":2783,"slug":294,"model_name":295,"provider_name":2706,"name":295,"provider":2706,"aa_name":2784,"is_open":37,"author_country":2653,"release_date":297,"release_month":261,"context_length":298,"inference_mode":2654,"input_price_per_1m_tokens":288,"output_price_per_1m_tokens":299,"input_price":288,"output_price":299,"tokens_per_second":2785,"time_to_first_token":2786,"benchmark_aime":305,"benchmark_aime_25":2787,"benchmark_gpqa":2788,"benchmark_hle":2719,"benchmark_ifbench":2789,"benchmark_lcr":516,"benchmark_livecodebench":2790,"benchmark_math_hard":304,"benchmark_mmlu_pro":2791,"benchmark_scicode":2792,"benchmark_tau2":2793,"benchmark_terminalbench":524,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2787,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":302,"benchmark_intelligence":2073,"benchmark_coding":960},"16c7cb82-d6f6-40f5-a1ac-6394d139ca04","420c3d02-a2a3-48e0-8a23-44383ac5b45f","Llama 3.1 Instruct 8B",180.334,0.463,4.3,25.900000000000002,28.599999999999998,11.600000000000001,47.599999999999994,13.200000000000001,16.400000000000002,{"aa_id":12,"ppt_model_id":2795,"slug":349,"model_name":350,"provider_name":226,"name":350,"provider":226,"aa_name":12,"is_open":37,"author_country":2653,"release_date":352,"release_month":337,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":61,"input_price":61,"output_price":61,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":2797,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":2798,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":158},"cb0aba82-0a55-450a-bef4-1b53adb61ccd",76.6667,64.2298,51.2195,{"aa_id":2800,"ppt_model_id":2801,"slug":355,"model_name":356,"provider_name":2802,"name":356,"provider":2802,"aa_name":2803,"is_open":37,"author_country":2653,"release_date":358,"release_month":337,"context_length":181,"inference_mode":2654,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":50,"input_price":50,"output_price":50,"tokens_per_second":2804,"time_to_first_token":2805,"benchmark_aime":363,"benchmark_aime_25":12,"benchmark_gpqa":360,"benchmark_hle":2699,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":361,"benchmark_math_hard":2806,"benchmark_mmlu_pro":2807,"benchmark_scicode":689,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":1188,"benchmark_agieval_zh":12,"benchmark_agieval_en":2808,"benchmark_arc_challenge":12,"benchmark_arc_easy":2809,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":2810,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":2811,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2812},"2e18981c-2d85-4524-9607-e7f97f650668","817f8335-76bb-47aa-9ce6-888fc5fed7a9","Nous Research","Hermes 3 - Llama-3.1 70B",35.57,0.334,53.800000000000004,57.099999999999994,62.4509,97.6431,24.0741,17.1059,10.6,{"aa_id":2814,"ppt_model_id":2815,"slug":407,"model_name":408,"provider_name":1833,"name":408,"provider":1833,"aa_name":2816,"is_open":37,"author_country":2817,"release_date":410,"release_month":403,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":411,"output_price_per_1m_tokens":324,"input_price":411,"output_price":324,"tokens_per_second":2818,"time_to_first_token":2819,"benchmark_aime":417,"benchmark_aime_25":2820,"benchmark_gpqa":413,"benchmark_hle":2752,"benchmark_ifbench":2821,"benchmark_lcr":2822,"benchmark_livecodebench":415,"benchmark_math_hard":416,"benchmark_mmlu_pro":412,"benchmark_scicode":2779,"benchmark_tau2":2071,"benchmark_terminalbench":545,"benchmark_accountingaudit":12,"benchmark_agieval_zh":2823,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":2824,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":2825,"benchmark_humaneval":2826,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":439,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":2827,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":414,"benchmark_intelligence":1068,"benchmark_coding":2828},"bd2fa4e3-7309-41cb-9a1c-b4b06d556ad7","945dfadf-da24-4062-8a33-db8ea9ee2020","Qwen2.5 Instruct 72B","cn",55.696,1.149,14.000000000000002,36.9,20.3,78.3537,72.4466,92.9492,82.3171,100,11.9,{"aa_id":2830,"ppt_model_id":2831,"slug":420,"model_name":421,"provider_name":2706,"name":421,"provider":2706,"aa_name":2832,"is_open":37,"author_country":2653,"release_date":423,"release_month":403,"context_length":424,"inference_mode":2654,"input_price_per_1m_tokens":207,"output_price_per_1m_tokens":299,"input_price":207,"output_price":299,"tokens_per_second":2833,"time_to_first_token":2834,"benchmark_aime":429,"benchmark_aime_25":2691,"benchmark_gpqa":426,"benchmark_hle":2835,"benchmark_ifbench":2836,"benchmark_lcr":78,"benchmark_livecodebench":427,"benchmark_math_hard":428,"benchmark_mmlu_pro":2837,"benchmark_scicode":2835,"benchmark_tau2":2684,"benchmark_terminalbench":12,"benchmark_accountingaudit":497,"benchmark_agieval_zh":12,"benchmark_agieval_en":2838,"benchmark_arc_challenge":2839,"benchmark_arc_easy":2840,"benchmark_bbeh":12,"benchmark_bbh":2841,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":1270,"benchmark_gaia":12,"benchmark_gsm8k":2842,"benchmark_humaneval":2843,"benchmark_ifeval":12,"benchmark_knights_and_knaves":2844,"benchmark_math":2845,"benchmark_mbppplus":2846,"benchmark_medqa":2847,"benchmark_mmlu":2848,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":2849,"benchmark_stock_bcs":2850,"benchmark_swe_bench_lite":12,"benchmark_wmdp":2851,"benchmark_wmt":2852,"benchmark_intelligence":985},"771d4144-38db-4f5c-9d04-6e8d901e5c8a","3f39f9b8-fb10-4d81-8279-cc2e2e0a5031","Llama 3.2 Instruct 3B",53.641,0.37,5.2,26.200000000000003,34.699999999999996,26.5122,56.314,78.5774,36.0043,30.8271,47.561,6.1429,74.3719,26.455,52.6316,15.3101,0.5086,8.3333,6.6798,25.1791,{"aa_id":2854,"ppt_model_id":2855,"slug":442,"model_name":443,"provider_name":2706,"name":443,"provider":2706,"aa_name":2856,"is_open":37,"author_country":2653,"release_date":423,"release_month":403,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":445,"output_price_per_1m_tokens":445,"input_price":445,"output_price":445,"tokens_per_second":2857,"time_to_first_token":2858,"benchmark_aime":450,"benchmark_aime_25":2859,"benchmark_gpqa":447,"benchmark_hle":2835,"benchmark_ifbench":2860,"benchmark_lcr":2729,"benchmark_livecodebench":448,"benchmark_math_hard":449,"benchmark_mmlu_pro":2861,"benchmark_scicode":2862,"benchmark_tau2":1332,"benchmark_terminalbench":524,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1940,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2863,"benchmark_coding":2787},"2eb1ec42-7590-4fe6-b447-26d6fead6b43","5941f3b1-615b-4cf4-825c-f6768eedda18","Llama 3.2 Instruct 11B (Vision)",82.499,0.375,1.7000000000000002,30.4,46.400000000000006,11.200000000000001,8.7,{"aa_id":2865,"ppt_model_id":2866,"slug":432,"model_name":433,"provider_name":2706,"name":433,"provider":2706,"aa_name":2867,"is_open":37,"author_country":2653,"release_date":423,"release_month":403,"context_length":435,"inference_mode":2654,"input_price_per_1m_tokens":288,"output_price_per_1m_tokens":288,"input_price":288,"output_price":288,"tokens_per_second":2868,"time_to_first_token":2869,"benchmark_aime":2667,"benchmark_aime_25":2667,"benchmark_gpqa":437,"benchmark_hle":1146,"benchmark_ifbench":229,"benchmark_lcr":505,"benchmark_livecodebench":438,"benchmark_math_hard":2820,"benchmark_mmlu_pro":436,"benchmark_scicode":2859,"benchmark_tau2":2667,"benchmark_terminalbench":2667,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2667,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1004,"benchmark_coding":274},"2a8e2a83-4e48-4f7e-8374-612c562496ad","03c9847b-100b-454b-a8c8-a970b3fdbc76","Llama 3.2 Instruct 1B",91.717,0.543,{"aa_id":12,"ppt_model_id":2871,"slug":473,"model_name":474,"provider_name":467,"name":474,"provider":467,"aa_name":12,"is_open":11,"author_country":2653,"release_date":469,"release_month":470,"context_length":59,"inference_mode":2654,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":156,"input_price":220,"output_price":156,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":2667,"benchmark_agieval_zh":12,"benchmark_agieval_en":2872,"benchmark_arc_challenge":2873,"benchmark_arc_easy":2874,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":2875,"benchmark_math":12,"benchmark_mbppplus":2876,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12},"9b7d0e4e-f935-4f91-ab61-2e24ba857173",60.4167,89.2491,97.1801,12.4821,32.2751,{"aa_id":12,"ppt_model_id":2878,"slug":465,"model_name":466,"provider_name":467,"name":466,"provider":467,"aa_name":12,"is_open":11,"author_country":2653,"release_date":469,"release_month":470,"context_length":59,"inference_mode":2654,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":156,"input_price":220,"output_price":156,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":2667,"benchmark_agieval_zh":2879,"benchmark_agieval_en":12,"benchmark_arc_challenge":2873,"benchmark_arc_easy":2880,"benchmark_bbeh":2881,"benchmark_bbh":2882,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":2667,"benchmark_gaia":12,"benchmark_gsm8k":2883,"benchmark_humaneval":2884,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2885,"benchmark_mbppplus":2886,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":2887,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":2667,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":2888},"4aa2d796-292f-40fb-a59f-22562ebc44c0",49.7228,96.633,9.9558,28.2292,64.0364,48.1707,36.8874,30.504,41.9822,30.0241,{"aa_id":2890,"ppt_model_id":2891,"slug":478,"model_name":479,"provider_name":2892,"name":479,"provider":2892,"aa_name":2893,"is_open":11,"author_country":2653,"release_date":482,"release_month":470,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":312,"output_price_per_1m_tokens":312,"input_price":312,"output_price":312,"tokens_per_second":2894,"time_to_first_token":2895,"benchmark_aime":488,"benchmark_aime_25":448,"benchmark_gpqa":484,"benchmark_hle":2776,"benchmark_ifbench":2896,"benchmark_lcr":2897,"benchmark_livecodebench":2898,"benchmark_math_hard":487,"benchmark_mmlu_pro":483,"benchmark_scicode":603,"benchmark_tau2":689,"benchmark_terminalbench":545,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":448,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":485,"benchmark_intelligence":2899,"benchmark_coding":2900},"be7ccc43-9ec6-45c1-adbf-554827955b3d","74a33613-5b3a-4b73-b3f3-8941218ec08c","NVIDIA","Llama 3.1 Nemotron Instruct 70B",46.794,0.432,30.7,7.000000000000001,16.900000000000002,13.4,10.8,{"aa_id":2902,"ppt_model_id":2903,"slug":508,"model_name":509,"provider_name":138,"name":509,"provider":138,"aa_name":2904,"is_open":11,"author_country":2653,"release_date":504,"release_month":470,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":516,"benchmark_aime_25":12,"benchmark_gpqa":512,"benchmark_hle":1875,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":514,"benchmark_math_hard":2905,"benchmark_mmlu_pro":511,"benchmark_scicode":2906,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":513,"benchmark_intelligence":2907,"benchmark_coding":2908},"ce1dfb08-c08a-403a-a088-b8b58c8d63ee","a16d6f67-ae87-4af7-9372-c2f1142cb20c","Claude 3.5 Sonnet (Oct '24)",77.10000000000001,36.6,15.9,30.2,{"aa_id":2910,"ppt_model_id":2911,"slug":519,"model_name":520,"provider_name":138,"name":520,"provider":138,"aa_name":520,"is_open":11,"author_country":2653,"release_date":522,"release_month":523,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":524,"output_price_per_1m_tokens":69,"input_price":524,"output_price":69,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":2691,"benchmark_aime_25":12,"benchmark_gpqa":526,"benchmark_hle":2912,"benchmark_ifbench":959,"benchmark_lcr":603,"benchmark_livecodebench":527,"benchmark_math_hard":528,"benchmark_mmlu_pro":525,"benchmark_scicode":2913,"benchmark_tau2":2720,"benchmark_terminalbench":363,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":12,"benchmark_agieval_en":2914,"benchmark_arc_challenge":2915,"benchmark_arc_easy":12,"benchmark_bbeh":2916,"benchmark_bbh":2917,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":2262,"benchmark_gaia":12,"benchmark_gsm8k":2918,"benchmark_humaneval":2919,"benchmark_ifeval":12,"benchmark_knights_and_knaves":161,"benchmark_math":2920,"benchmark_mbppplus":2921,"benchmark_medqa":2922,"benchmark_mmlu":2923,"benchmark_mmmu":2924,"benchmark_multichallenge":12,"benchmark_simpleqa":2925,"benchmark_stock_bcs":497,"benchmark_swe_bench_lite":2926,"benchmark_wmdp":2927,"benchmark_wmt":2928,"benchmark_intelligence":1987,"benchmark_coding":605},"dbf399be-8a39-4a58-a333-19354eabdbc0","9236791b-0d39-46cb-ad9d-0f360bb2d151",3.5000000000000004,27.400000000000002,66.2215,90.3584,16.7068,77.0389,93.2525,75.6098,73.5587,33.8753,77.769,72.7603,54.3333,7.975,27.6667,64.2585,35.5634,{"aa_id":2930,"ppt_model_id":2931,"slug":548,"model_name":549,"provider_name":1833,"name":549,"provider":1833,"aa_name":2932,"is_open":37,"author_country":2817,"release_date":551,"release_month":523,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":552,"output_price_per_1m_tokens":524,"input_price":552,"output_price":524,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":558,"benchmark_aime_25":12,"benchmark_gpqa":2933,"benchmark_hle":2934,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":556,"benchmark_math_hard":557,"benchmark_mmlu_pro":553,"benchmark_scicode":2935,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":555,"benchmark_intelligence":2936},"8a28a24b-4341-468d-b0df-996876989ebe","95cf10d6-7c02-4837-aeef-252ee061c737","Qwen2.5 Coder Instruct 32B",41.699999999999996,3.8,27.1,12.9,{"aa_id":2938,"ppt_model_id":2939,"slug":561,"model_name":562,"provider_name":2665,"name":562,"provider":2665,"aa_name":2940,"is_open":37,"author_country":2666,"release_date":564,"release_month":523,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":565,"input_price":78,"output_price":565,"tokens_per_second":2941,"time_to_first_token":2942,"benchmark_aime":2897,"benchmark_aime_25":363,"benchmark_gpqa":567,"benchmark_hle":2943,"benchmark_ifbench":2071,"benchmark_lcr":2944,"benchmark_livecodebench":568,"benchmark_math_hard":2945,"benchmark_mmlu_pro":566,"benchmark_scicode":119,"benchmark_tau2":1644,"benchmark_terminalbench":12,"benchmark_accountingaudit":497,"benchmark_agieval_zh":2946,"benchmark_agieval_en":2947,"benchmark_arc_challenge":2948,"benchmark_arc_easy":12,"benchmark_bbeh":2949,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":2950,"benchmark_humaneval":2826,"benchmark_ifeval":12,"benchmark_knights_and_knaves":2951,"benchmark_math":2952,"benchmark_mbppplus":2953,"benchmark_medqa":2954,"benchmark_mmlu":2955,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":2956,"benchmark_stock_bcs":2957,"benchmark_swe_bench_lite":12,"benchmark_wmdp":2958,"benchmark_wmt":12,"benchmark_intelligence":439},"22a3643b-66dc-47f6-9e50-19916ffe0e03","8b180f1c-e6df-4f42-847d-ce83a3d5be39","Pixtral Large",53.942,0.452,3.5999999999999996,10.299999999999999,71.39999999999999,63.1098,64.6504,92.1502,14.7566,91.8878,31.4286,68.52,53.9683,78.3189,77.2326,16.736,16.6667,65.3217,{"aa_id":2960,"ppt_model_id":2961,"slug":573,"model_name":574,"provider_name":2665,"name":574,"provider":2665,"aa_name":2962,"is_open":37,"author_country":2666,"release_date":576,"release_month":523,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":565,"input_price":78,"output_price":565,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":450,"benchmark_aime_25":2667,"benchmark_gpqa":2963,"benchmark_hle":600,"benchmark_ifbench":2964,"benchmark_lcr":2859,"benchmark_livecodebench":2779,"benchmark_math_hard":2945,"benchmark_mmlu_pro":2965,"benchmark_scicode":2935,"benchmark_tau2":861,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2667,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":579,"benchmark_intelligence":880},"3eaef2fa-f153-47ff-a289-131b4ac5e9c4","95788946-0110-4c67-93af-7aa63b196a19","Mistral Large 2 (Jul '24)",47.199999999999996,31.6,68.30000000000001,{"aa_id":2967,"ppt_model_id":2968,"slug":583,"model_name":584,"provider_name":2665,"name":584,"provider":2665,"aa_name":2969,"is_open":11,"author_country":2666,"release_date":586,"release_month":523,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":565,"input_price":78,"output_price":565,"tokens_per_second":2970,"time_to_first_token":2971,"benchmark_aime":448,"benchmark_aime_25":2820,"benchmark_gpqa":588,"benchmark_hle":69,"benchmark_ifbench":2972,"benchmark_lcr":1146,"benchmark_livecodebench":2973,"benchmark_math_hard":590,"benchmark_mmlu_pro":2974,"benchmark_scicode":119,"benchmark_tau2":2896,"benchmark_terminalbench":2975,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":2976,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":2977,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":439,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":414,"benchmark_intelligence":1713,"benchmark_coding":1209},"a97d7008-459c-4d25-b94d-8cc1a0fcd26d","8bf2d997-f789-41f8-9c29-71cdfed2a48b","Mistral Large 2 (Nov '24)",37.477,0.489,31.2,29.299999999999997,69.69999999999999,6.1,64.4933,70.2503,{"aa_id":2979,"ppt_model_id":2980,"slug":593,"model_name":594,"provider_name":595,"name":594,"provider":595,"aa_name":2981,"is_open":11,"author_country":2653,"release_date":597,"release_month":598,"context_length":599,"inference_mode":2654,"input_price_per_1m_tokens":524,"output_price_per_1m_tokens":600,"input_price":524,"output_price":600,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":605,"benchmark_aime_25":2897,"benchmark_gpqa":212,"benchmark_hle":2675,"benchmark_ifbench":514,"benchmark_lcr":1243,"benchmark_livecodebench":603,"benchmark_math_hard":2982,"benchmark_mmlu_pro":601,"benchmark_scicode":2676,"benchmark_tau2":2820,"benchmark_terminalbench":2975,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":2983,"benchmark_agieval_en":2984,"benchmark_arc_challenge":2985,"benchmark_arc_easy":2986,"benchmark_bbeh":2987,"benchmark_bbh":2988,"benchmark_bfcl_v3":2989,"benchmark_bird_critic":12,"benchmark_darkbench":2990,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":2991,"benchmark_humaneval":2992,"benchmark_ifeval":2993,"benchmark_knights_and_knaves":2994,"benchmark_math":2995,"benchmark_mbppplus":2996,"benchmark_medqa":2997,"benchmark_mmlu":2998,"benchmark_mmmu":2999,"benchmark_multichallenge":3000,"benchmark_simpleqa":3001,"benchmark_stock_bcs":174,"benchmark_swe_bench_lite":3002,"benchmark_wmdp":3003,"benchmark_wmt":3004,"benchmark_aider":602,"benchmark_intelligence":3005,"benchmark_coding":448},"406ef766-0c07-4c3d-a35e-0ff3d8902aca","96fdf5d4-7b9e-41f7-88cf-d08da4adc334","Nova Pro",78.60000000000001,64.8004,65.5145,92.7474,98.8215,15.9292,83.8888,67.9351,42.7273,91.6603,76.8293,81.8854,28.2857,74.78,49.2064,79.3401,78.2581,50.0577,19.0476,12.5839,2.6667,67.0393,36.9146,13.5,{"aa_id":3007,"ppt_model_id":3008,"slug":608,"model_name":609,"provider_name":595,"name":609,"provider":595,"aa_name":3009,"is_open":11,"author_country":2653,"release_date":611,"release_month":598,"context_length":129,"inference_mode":2654,"input_price_per_1m_tokens":612,"output_price_per_1m_tokens":116,"input_price":612,"output_price":116,"tokens_per_second":3010,"time_to_first_token":3011,"benchmark_aime":615,"benchmark_aime_25":565,"benchmark_gpqa":614,"benchmark_hle":3012,"benchmark_ifbench":3013,"benchmark_lcr":3014,"benchmark_livecodebench":2820,"benchmark_math_hard":316,"benchmark_mmlu_pro":613,"benchmark_scicode":3015,"benchmark_tau2":2820,"benchmark_terminalbench":26,"benchmark_accountingaudit":3016,"benchmark_agieval_zh":3017,"benchmark_agieval_en":3018,"benchmark_arc_challenge":3019,"benchmark_arc_easy":3020,"benchmark_bbeh":3021,"benchmark_bbh":3022,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3023,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3024,"benchmark_math":3025,"benchmark_mbppplus":3026,"benchmark_medqa":12,"benchmark_mmlu":3027,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3028,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3029,"benchmark_coding":3030},"cea4d0bc-e23b-4087-aa5a-c253c5568bc0","8960a348-2955-4923-9f79-50514da86499","Nova Micro",283.855,0.352,4.7,29.4,9.700000000000001,9.4,53.3333,56.153,55.6167,86.9454,95.8333,13.1637,61.5266,91.0538,19.2857,67.02,47.8836,68.9432,4.6694,10.3,4.1,{"aa_id":3032,"ppt_model_id":3033,"slug":618,"model_name":619,"provider_name":595,"name":619,"provider":595,"aa_name":3034,"is_open":11,"author_country":2653,"release_date":621,"release_month":598,"context_length":599,"inference_mode":2654,"input_price_per_1m_tokens":41,"output_price_per_1m_tokens":622,"input_price":41,"output_price":622,"tokens_per_second":3035,"time_to_first_token":3036,"benchmark_aime":605,"benchmark_aime_25":2897,"benchmark_gpqa":624,"benchmark_hle":2776,"benchmark_ifbench":1344,"benchmark_lcr":3037,"benchmark_livecodebench":625,"benchmark_math_hard":626,"benchmark_mmlu_pro":623,"benchmark_scicode":3038,"benchmark_tau2":3039,"benchmark_terminalbench":524,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":3040,"benchmark_arc_challenge":12,"benchmark_arc_easy":3041,"benchmark_bbeh":12,"benchmark_bbh":3042,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3043,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":566,"benchmark_mbppplus":3044,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3045,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3046,"benchmark_coding":2719},"4ec24470-96fe-4c27-806b-cdd2d429b04d","720b8ab4-98ae-4cad-b01e-b2df3797898d","Nova Lite",183.28,0.396,17.7,13.900000000000002,17.5,65.7502,97.5168,59.0078,78.0488,50.7937,6.565,12.7,{"aa_id":3048,"ppt_model_id":3049,"slug":629,"model_name":630,"provider_name":2706,"name":630,"provider":2706,"aa_name":3050,"is_open":37,"author_country":2653,"release_date":632,"release_month":598,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":633,"input_price":495,"output_price":633,"tokens_per_second":3051,"time_to_first_token":2741,"benchmark_aime":16,"benchmark_aime_25":305,"benchmark_gpqa":635,"benchmark_hle":69,"benchmark_ifbench":3052,"benchmark_lcr":161,"benchmark_livecodebench":3053,"benchmark_math_hard":638,"benchmark_mmlu_pro":634,"benchmark_scicode":1254,"benchmark_tau2":723,"benchmark_terminalbench":68,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":305,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":636,"benchmark_intelligence":2768,"benchmark_coding":605},"1d59107b-195f-4d04-8b34-f23ead9bf7ef","7c664278-8746-4552-9447-a3c1c05928e6","Llama 3.3 Instruct 70B",87.34,47.099999999999994,28.799999999999997,{"aa_id":3055,"ppt_model_id":3056,"slug":648,"model_name":649,"provider_name":9,"name":649,"provider":9,"aa_name":649,"is_open":11,"author_country":2653,"release_date":651,"release_month":598,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":161,"output_price_per_1m_tokens":17,"input_price":161,"output_price":17,"tokens_per_second":3057,"time_to_first_token":3058,"benchmark_aime":656,"benchmark_aime_25":12,"benchmark_gpqa":653,"benchmark_hle":305,"benchmark_ifbench":316,"benchmark_lcr":1553,"benchmark_livecodebench":654,"benchmark_math_hard":655,"benchmark_mmlu_pro":652,"benchmark_scicode":614,"benchmark_tau2":3059,"benchmark_terminalbench":2936,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":513,"benchmark_intelligence":3060,"benchmark_coding":3061},"bb4a1fe1-629f-443f-87f5-0fe3e79fff8c","6c3e465d-f722-44fa-9d39-020c614383c9",106.259,22.018,62.6,30.8,20.5,{"aa_id":12,"ppt_model_id":3063,"slug":665,"model_name":666,"provider_name":667,"name":666,"provider":667,"aa_name":12,"is_open":37,"author_country":2817,"release_date":669,"release_month":598,"context_length":670,"inference_mode":2654,"input_price_per_1m_tokens":671,"output_price_per_1m_tokens":672,"input_price":671,"output_price":672,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":3064,"benchmark_agieval_en":3065,"benchmark_arc_challenge":3066,"benchmark_arc_easy":3067,"benchmark_bbeh":3068,"benchmark_bbh":3069,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":1375,"benchmark_gaia":12,"benchmark_gsm8k":3070,"benchmark_humaneval":3071,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3072,"benchmark_math":3073,"benchmark_mbppplus":3074,"benchmark_medqa":3075,"benchmark_mmlu":3076,"benchmark_mmmu":3077,"benchmark_multichallenge":12,"benchmark_simpleqa":3078,"benchmark_stock_bcs":3079,"benchmark_swe_bench_lite":3080,"benchmark_wmdp":3081,"benchmark_wmt":3082,"benchmark_aider":673},"18bbec8a-17fe-4d36-81b8-6f1c6111a913",75.7761,76.198,93.9607,98.569,15.3862,69.8098,93.7832,87.1951,60.3333,83.12,51.0582,80.3109,83.4108,48.2222,23.0049,66.6667,29.097,71.7557,36.6432,{"aa_id":3084,"ppt_model_id":3085,"slug":683,"model_name":684,"provider_name":3086,"name":684,"provider":3086,"aa_name":3087,"is_open":37,"author_country":2653,"release_date":686,"release_month":680,"context_length":298,"inference_mode":2654,"input_price_per_1m_tokens":687,"output_price_per_1m_tokens":116,"input_price":687,"output_price":116,"tokens_per_second":3088,"time_to_first_token":195,"benchmark_aime":3089,"benchmark_aime_25":3090,"benchmark_gpqa":3091,"benchmark_hle":2699,"benchmark_ifbench":3092,"benchmark_lcr":2667,"benchmark_livecodebench":689,"benchmark_math_hard":690,"benchmark_mmlu_pro":2945,"benchmark_scicode":1254,"benchmark_tau2":2667,"benchmark_terminalbench":2934,"benchmark_accountingaudit":3079,"benchmark_agieval_zh":3093,"benchmark_agieval_en":3094,"benchmark_arc_challenge":3095,"benchmark_arc_easy":3096,"benchmark_bbeh":3097,"benchmark_bbh":3098,"benchmark_bfcl_v3":3099,"benchmark_bird_critic":12,"benchmark_darkbench":3100,"benchmark_formal_logic_exp":985,"benchmark_gaia":12,"benchmark_gsm8k":3101,"benchmark_humaneval":3102,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3103,"benchmark_math":3104,"benchmark_mbppplus":3105,"benchmark_medqa":3106,"benchmark_mmlu":3107,"benchmark_mmmu":3108,"benchmark_multichallenge":12,"benchmark_simpleqa":3109,"benchmark_stock_bcs":174,"benchmark_swe_bench_lite":2667,"benchmark_wmdp":3110,"benchmark_wmt":12,"benchmark_intelligence":3111,"benchmark_coding":1002},"8668e182-c7cc-4050-a43a-efa2e3255e17","ba99fedf-a35e-45cf-bde8-57e8a17f61e5","Microsoft Azure","Phi-4",37.256,14.299999999999999,18,57.49999999999999,23.5,60.8093,68.2247,94.6154,98.9478,10.1327,39.3642,40.8467,49.543,91.2813,95.5414,38.2857,78.18,61.9048,77.8476,77.5744,39.6667,2.3116,58.0425,10.4,{"aa_id":3113,"ppt_model_id":3114,"slug":703,"model_name":704,"provider_name":3115,"name":704,"provider":3115,"aa_name":3116,"is_open":11,"author_country":2817,"release_date":706,"release_month":680,"context_length":707,"inference_mode":2654,"input_price_per_1m_tokens":708,"output_price_per_1m_tokens":78,"input_price":708,"output_price":78,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":2965,"benchmark_aime_25":3117,"benchmark_gpqa":710,"benchmark_hle":450,"benchmark_ifbench":1071,"benchmark_lcr":3118,"benchmark_livecodebench":712,"benchmark_math_hard":713,"benchmark_mmlu_pro":3119,"benchmark_scicode":3120,"benchmark_tau2":3121,"benchmark_terminalbench":2975,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":3122,"benchmark_agieval_en":3123,"benchmark_arc_challenge":3124,"benchmark_arc_easy":3125,"benchmark_bbeh":12,"benchmark_bbh":3126,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":3127,"benchmark_gaia":12,"benchmark_gsm8k":3128,"benchmark_humaneval":3129,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3130,"benchmark_math":3131,"benchmark_mbppplus":3132,"benchmark_medqa":3133,"benchmark_mmlu":12,"benchmark_mmmu":3134,"benchmark_multichallenge":12,"benchmark_simpleqa":3135,"benchmark_stock_bcs":3136,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":711,"benchmark_intelligence":361,"benchmark_coding":2907},"6aa30489-9f35-4f65-99a0-7cf9bfe42e6f","f2a8a356-ba23-4049-aff9-38503fdaca79","DeepSeek","DeepSeek R1 (Jan '25)",68,52.300000000000004,84.39999999999999,35.699999999999996,11.4,87.8365,87.6176,91.4676,97.9377,83.469,98.401,96.1576,97.4194,97.2583,92.7257,64.69,92.1445,50.6667,29.1493,91.6667,{"aa_id":3138,"ppt_model_id":3139,"slug":716,"model_name":717,"provider_name":3115,"name":717,"provider":3115,"aa_name":3140,"is_open":37,"author_country":2817,"release_date":719,"release_month":680,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":720,"output_price_per_1m_tokens":524,"input_price":720,"output_price":524,"tokens_per_second":3141,"time_to_first_token":3142,"benchmark_aime":725,"benchmark_aime_25":183,"benchmark_gpqa":722,"benchmark_hle":2975,"benchmark_ifbench":415,"benchmark_lcr":448,"benchmark_livecodebench":723,"benchmark_math_hard":724,"benchmark_mmlu_pro":721,"benchmark_scicode":2972,"benchmark_tau2":3143,"benchmark_terminalbench":26,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":183,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":417,"benchmark_coding":3121},"d72dfe7c-8281-448d-b744-8f64793f2f7c","ffb4c499-8b9d-4ac4-b3a3-a3de4450b353","DeepSeek R1 Distill Llama 70B",40.201,0.629,21.9,{"aa_id":3145,"ppt_model_id":3146,"slug":728,"model_name":729,"provider_name":730,"name":729,"provider":730,"aa_name":729,"is_open":11,"author_country":2653,"release_date":732,"release_month":680,"context_length":733,"inference_mode":2654,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":61,"input_price":61,"output_price":61,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":3147,"benchmark_aime_25":12,"benchmark_gpqa":3052,"benchmark_hle":3148,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":556,"benchmark_math_hard":3149,"benchmark_mmlu_pro":3150,"benchmark_scicode":2745,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3151},"a2439c01-fbe9-49b0-8e22-ecb0597d759a","3cc7597f-fb99-4436-a765-e0176e292104",48.699999999999996,7.3,81.69999999999999,68.89999999999999,15.5,{"aa_id":3153,"ppt_model_id":3154,"slug":740,"model_name":741,"provider_name":3115,"name":741,"provider":3115,"aa_name":3155,"is_open":11,"author_country":2817,"release_date":743,"release_month":680,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":744,"output_price_per_1m_tokens":744,"input_price":744,"output_price":744,"tokens_per_second":3156,"time_to_first_token":3157,"benchmark_aime":749,"benchmark_aime_25":3158,"benchmark_gpqa":746,"benchmark_hle":3159,"benchmark_ifbench":2745,"benchmark_lcr":3014,"benchmark_livecodebench":747,"benchmark_math_hard":748,"benchmark_mmlu_pro":745,"benchmark_scicode":302,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3158,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3160},"da2f37aa-39d8-4ce6-b51e-2bf7e07ba807","6737dbfe-77a1-4ad1-83bf-5076fe825a2d","DeepSeek R1 Distill Qwen 32B",45.824,0.304,63,5.5,17.2,{"aa_id":3162,"ppt_model_id":3163,"slug":752,"model_name":753,"provider_name":2665,"name":753,"provider":2665,"aa_name":3164,"is_open":37,"author_country":2666,"release_date":755,"release_month":680,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":251,"input_price":299,"output_price":251,"tokens_per_second":3165,"time_to_first_token":3166,"benchmark_aime":615,"benchmark_aime_25":2787,"benchmark_gpqa":27,"benchmark_hle":2699,"benchmark_ifbench":3167,"benchmark_lcr":2667,"benchmark_livecodebench":757,"benchmark_math_hard":758,"benchmark_mmlu_pro":756,"benchmark_scicode":3168,"benchmark_tau2":437,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2787,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3046},"0bfe5c11-4419-48d1-ae65-f81024a704f7","c8653ae4-7968-41d4-b29a-f91df3a0074a","Mistral Small 3",153.417,0.497,26.400000000000002,23.599999999999998,{"aa_id":3170,"ppt_model_id":3171,"slug":761,"model_name":762,"provider_name":9,"name":762,"provider":9,"aa_name":3172,"is_open":11,"author_country":2653,"release_date":764,"release_month":680,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":700,"output_price_per_1m_tokens":765,"input_price":700,"output_price":765,"tokens_per_second":3173,"time_to_first_token":3174,"benchmark_aime":771,"benchmark_aime_25":12,"benchmark_gpqa":767,"benchmark_hle":2863,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":769,"benchmark_math_hard":770,"benchmark_mmlu_pro":3175,"benchmark_scicode":3176,"benchmark_tau2":983,"benchmark_terminalbench":2753,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":3177,"benchmark_agieval_en":3178,"benchmark_arc_challenge":12,"benchmark_arc_easy":3179,"benchmark_bbeh":12,"benchmark_bbh":3180,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":3181,"benchmark_gaia":12,"benchmark_gsm8k":3182,"benchmark_humaneval":3183,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3184,"benchmark_math":3185,"benchmark_mbppplus":3186,"benchmark_medqa":3187,"benchmark_mmlu":3188,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3189,"benchmark_stock_bcs":3190,"benchmark_swe_bench_lite":12,"benchmark_wmdp":3191,"benchmark_wmt":12,"benchmark_aider":768,"benchmark_intelligence":301,"benchmark_coding":3192},"19e15343-883e-499c-9d3b-d5afec0d7fe7","8efa97d0-087d-4c20-baa5-6b96f742d376","o3-mini",137.265,7.173,79.10000000000001,39.900000000000006,74.7506,81.8932,98.6111,84.3956,99.8,95.2237,95.122,99.7143,93.08,63.2275,91.359,88.9265,13.9917,83.3333,80.4938,17.9,{"aa_id":3194,"ppt_model_id":3195,"slug":774,"model_name":775,"provider_name":1833,"name":775,"provider":1833,"aa_name":3196,"is_open":11,"author_country":2817,"release_date":777,"release_month":778,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":779,"output_price_per_1m_tokens":780,"input_price":779,"output_price":780,"tokens_per_second":3197,"time_to_first_token":3198,"benchmark_aime":603,"benchmark_aime_25":12,"benchmark_gpqa":3199,"benchmark_hle":545,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":784,"benchmark_math_hard":785,"benchmark_mmlu_pro":781,"benchmark_scicode":917,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":783,"benchmark_intelligence":811},"e3d16a21-4130-450a-8de7-14a77d0f32ea","cbc11c05-ab40-4b56-a2a5-14d3fe8c7cea","Qwen2.5 Max",47.118,1.101,58.699999999999996,{"aa_id":3201,"ppt_model_id":3202,"slug":803,"model_name":804,"provider_name":1833,"name":804,"provider":1833,"aa_name":3203,"is_open":11,"author_country":2817,"release_date":806,"release_month":778,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":807,"output_price_per_1m_tokens":808,"input_price":807,"output_price":808,"tokens_per_second":3204,"time_to_first_token":3205,"benchmark_aime":558,"benchmark_aime_25":12,"benchmark_gpqa":810,"benchmark_hle":2752,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":811,"benchmark_math_hard":812,"benchmark_mmlu_pro":809,"benchmark_scicode":3206,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":558},"8e026e69-91cb-4122-823c-b63c06e6b441","f51ec7b3-65c0-4d66-9b5b-1c4ad453e80d","Qwen2.5 Turbo",66.709,1.104,15.299999999999999,{"aa_id":3208,"ppt_model_id":3209,"slug":852,"model_name":853,"provider_name":248,"name":853,"provider":248,"aa_name":3210,"is_open":11,"author_country":2653,"release_date":855,"release_month":778,"context_length":856,"inference_mode":2654,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":536,"input_price":495,"output_price":536,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":861,"benchmark_aime_25":3211,"benchmark_gpqa":858,"benchmark_hle":1146,"benchmark_ifbench":722,"benchmark_lcr":3212,"benchmark_livecodebench":859,"benchmark_math_hard":860,"benchmark_mmlu_pro":857,"benchmark_scicode":3213,"benchmark_tau2":556,"benchmark_terminalbench":2934,"benchmark_accountingaudit":2667,"benchmark_agieval_zh":3214,"benchmark_agieval_en":3215,"benchmark_arc_challenge":3216,"benchmark_arc_easy":3217,"benchmark_bbeh":3218,"benchmark_bbh":3219,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3220,"benchmark_humaneval":3221,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3222,"benchmark_math":3223,"benchmark_mbppplus":3224,"benchmark_medqa":3225,"benchmark_mmlu":3226,"benchmark_mmmu":483,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":3227,"benchmark_wmt":3228,"benchmark_intelligence":904,"benchmark_coding":3229},"ef0c15a7-c6cb-427e-878d-5b500a8a5b01","32aa4ea8-eae9-48bf-91b7-8e025406c132","Gemini 2.0 Flash (Feb '25)",21.7,28.299999999999997,33.300000000000004,73.2816,73.4093,94.198,98.7795,18.5499,88.3181,95.0608,87.8049,52.8571,90.7391,61.1111,83.1893,84.7792,72.0011,38.8689,13.6,{"aa_id":3231,"ppt_model_id":3232,"slug":864,"model_name":865,"provider_name":9,"name":865,"provider":9,"aa_name":3233,"is_open":11,"author_country":2653,"release_date":867,"release_month":778,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":700,"output_price_per_1m_tokens":765,"input_price":700,"output_price":765,"tokens_per_second":3234,"time_to_first_token":3235,"benchmark_aime":871,"benchmark_aime_25":12,"benchmark_gpqa":638,"benchmark_hle":2685,"benchmark_ifbench":3236,"benchmark_lcr":3237,"benchmark_livecodebench":869,"benchmark_math_hard":870,"benchmark_mmlu_pro":868,"benchmark_scicode":3238,"benchmark_tau2":3239,"benchmark_terminalbench":2975,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":757,"benchmark_coding":330},"b05ca06f-a2b5-46a4-b65b-d7e7fd35307a","84555602-c3e6-4535-b03f-3f4b09bba542","o3-mini (high)",138.708,24.465,67.10000000000001,39.300000000000004,39.800000000000004,31.3,{"aa_id":3241,"ppt_model_id":3242,"slug":874,"model_name":875,"provider_name":2665,"name":875,"provider":2665,"aa_name":3243,"is_open":37,"author_country":2666,"release_date":877,"release_month":778,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":274,"input_price":377,"output_price":274,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":880,"benchmark_aime_25":12,"benchmark_gpqa":879,"benchmark_hle":2699,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":18,"benchmark_mmlu_pro":878,"benchmark_scicode":3244,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3245},"73cb1d6a-6a62-41d9-922e-adc0d40c874b","1bca1253-5ca7-4fcb-a44b-79ae65c16ab9","Mistral Saba",24.099999999999998,12.1,{"aa_id":3247,"ppt_model_id":3248,"slug":883,"model_name":3249,"provider_name":138,"name":884,"provider":138,"aa_name":3249,"is_open":11,"author_country":2653,"release_date":886,"release_month":778,"context_length":142,"inference_mode":3250,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":3147,"benchmark_aime_25":894,"benchmark_gpqa":511,"benchmark_hle":2944,"benchmark_ifbench":201,"benchmark_lcr":3251,"benchmark_livecodebench":892,"benchmark_math_hard":3252,"benchmark_mmlu_pro":891,"benchmark_scicode":3253,"benchmark_tau2":3254,"benchmark_terminalbench":1023,"benchmark_accountingaudit":3255,"benchmark_agieval_zh":12,"benchmark_agieval_en":3256,"benchmark_arc_challenge":3257,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3258,"benchmark_bfcl_v3":12,"benchmark_bird_critic":3259,"benchmark_darkbench":3260,"benchmark_formal_logic_exp":3261,"benchmark_gaia":3262,"benchmark_gsm8k":3263,"benchmark_humaneval":3264,"benchmark_ifeval":3265,"benchmark_knights_and_knaves":12,"benchmark_math":3266,"benchmark_mbppplus":3267,"benchmark_medqa":3268,"benchmark_mmlu":3269,"benchmark_mmmu":3270,"benchmark_multichallenge":12,"benchmark_simpleqa":3271,"benchmark_stock_bcs":3272,"benchmark_swe_bench_lite":12,"benchmark_wmdp":3273,"benchmark_wmt":3274,"benchmark_aider":329,"benchmark_livecodebench_reasoning":892,"benchmark_mmlu_pro_reasoning":891,"benchmark_gpqa_reasoning":511,"benchmark_math_hard_reasoning":893,"benchmark_aime_reasoning":737,"benchmark_aime_25_reasoning":894,"benchmark_hle_reasoning":3029,"benchmark_scicode_reasoning":1628,"benchmark_ifbench_reasoning":201,"benchmark_lcr_reasoning":3275,"benchmark_terminalbench_reasoning":1023,"benchmark_tau2_reasoning":3254,"benchmark_intelligence":3060,"benchmark_coding":580,"benchmark_intelligence_reasoning":425,"benchmark_coding_reasoning":415,"benchmark_math_reasoning":894},"3f2869f7-7fb2-462a-807f-7c80560c4b9c","ab4d3f3f-c47a-4ba7-aaad-2da29170204b","Claude 3.7 Sonnet (Reasoning)","reasoning",60.699999999999996,94.69999999999999,40.300000000000004,54.7,86.6667,87.5494,94.7099,90.972,29.6667,27.7273,95.5868,43.949,95.3632,96.1783,88.5338,89.0438,62.1333,92.2652,85.3012,66.8889,32.7785,58.3333,78.2443,37.4222,60.7,{"aa_id":3277,"ppt_model_id":3248,"slug":883,"model_name":884,"provider_name":138,"name":884,"provider":138,"aa_name":3278,"is_open":11,"author_country":2653,"release_date":886,"release_month":778,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":890,"benchmark_aime_25":2683,"benchmark_gpqa":3279,"benchmark_hle":3280,"benchmark_ifbench":1324,"benchmark_lcr":201,"benchmark_livecodebench":148,"benchmark_math_hard":889,"benchmark_mmlu_pro":3281,"benchmark_scicode":302,"benchmark_tau2":497,"benchmark_terminalbench":1023,"benchmark_accountingaudit":3190,"benchmark_agieval_zh":12,"benchmark_agieval_en":3282,"benchmark_arc_challenge":3257,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3258,"benchmark_bfcl_v3":12,"benchmark_bird_critic":3259,"benchmark_darkbench":3283,"benchmark_formal_logic_exp":2323,"benchmark_gaia":3262,"benchmark_gsm8k":3284,"benchmark_humaneval":3285,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3266,"benchmark_mbppplus":3286,"benchmark_medqa":3287,"benchmark_mmlu":3269,"benchmark_mmmu":3270,"benchmark_multichallenge":12,"benchmark_simpleqa":3271,"benchmark_stock_bcs":3272,"benchmark_swe_bench_lite":12,"benchmark_wmdp":3273,"benchmark_wmt":12,"benchmark_aider":329,"benchmark_livecodebench_reasoning":892,"benchmark_mmlu_pro_reasoning":891,"benchmark_gpqa_reasoning":511,"benchmark_math_hard_reasoning":893,"benchmark_aime_reasoning":737,"benchmark_aime_25_reasoning":894,"benchmark_hle_reasoning":3029,"benchmark_scicode_reasoning":1628,"benchmark_ifbench_reasoning":201,"benchmark_lcr_reasoning":3275,"benchmark_terminalbench_reasoning":1023,"benchmark_tau2_reasoning":3254,"benchmark_intelligence":3060,"benchmark_coding":580,"benchmark_intelligence_reasoning":425,"benchmark_coding_reasoning":415,"benchmark_math_reasoning":894},"aaa518a3-7399-44e6-b1fc-2f5f3ecc91d6","Claude 3.7 Sonnet (Non-reasoning)",65.60000000000001,4.8,80.30000000000001,74.0377,31.5152,95.8302,92.0732,60.582,87.5884,{"aa_id":3289,"ppt_model_id":3290,"slug":897,"model_name":898,"provider_name":248,"name":898,"provider":248,"aa_name":3291,"is_open":11,"author_country":2653,"release_date":900,"release_month":778,"context_length":856,"inference_mode":2654,"input_price_per_1m_tokens":901,"output_price_per_1m_tokens":50,"input_price":901,"output_price":50,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":3292,"benchmark_aime_25":12,"benchmark_gpqa":903,"benchmark_hle":2943,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":904,"benchmark_math_hard":905,"benchmark_mmlu_pro":3293,"benchmark_scicode":174,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2742},"4ec9587c-7fb3-4e1f-a0e8-c8b76ae8d4f5","7a71ae60-e155-4747-910b-9a43b51bec3b","Gemini 2.0 Flash-Lite (Feb '25)",27.700000000000003,72.39999999999999,{"aa_id":3295,"ppt_model_id":3296,"slug":909,"model_name":910,"provider_name":1833,"name":910,"provider":1833,"aa_name":910,"is_open":37,"author_country":2817,"release_date":912,"release_month":913,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":914,"input_price":273,"output_price":914,"tokens_per_second":3297,"time_to_first_token":3298,"benchmark_aime":1943,"benchmark_aime_25":3299,"benchmark_gpqa":1553,"benchmark_hle":3300,"benchmark_ifbench":3301,"benchmark_lcr":174,"benchmark_livecodebench":3302,"benchmark_math_hard":943,"benchmark_mmlu_pro":1876,"benchmark_scicode":614,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":3190,"benchmark_agieval_zh":3303,"benchmark_agieval_en":3304,"benchmark_arc_challenge":3305,"benchmark_arc_easy":3306,"benchmark_bbeh":12,"benchmark_bbh":3307,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":3308,"benchmark_gaia":12,"benchmark_gsm8k":3309,"benchmark_humaneval":3310,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3311,"benchmark_mbppplus":3312,"benchmark_medqa":3313,"benchmark_mmlu":3314,"benchmark_mmmu":3315,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":3079,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":916,"benchmark_intelligence":1986},"f08eea83-6b3a-476b-a641-5252c8aef040","ba9d63c2-da30-416b-ac0c-c9b58e002f0b",33.037,0.438,28.999999999999996,8.200000000000001,38.800000000000004,63.1,87.2714,88.0113,94.7009,98.7368,81.1572,89.5372,94.0439,95.5128,92.0996,62.069,86.4608,85.9475,52.8814,{"aa_id":3317,"ppt_model_id":3296,"slug":909,"model_name":910,"provider_name":1833,"name":910,"provider":1833,"aa_name":3318,"is_open":37,"author_country":2817,"release_date":912,"release_month":913,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":914,"input_price":273,"output_price":914,"tokens_per_second":3319,"time_to_first_token":3320,"benchmark_aime":3321,"benchmark_aime_25":12,"benchmark_gpqa":915,"benchmark_hle":3280,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":917,"benchmark_math_hard":918,"benchmark_mmlu_pro":275,"benchmark_scicode":2934,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":3190,"benchmark_agieval_zh":3303,"benchmark_agieval_en":3304,"benchmark_arc_challenge":3305,"benchmark_arc_easy":3306,"benchmark_bbeh":12,"benchmark_bbh":3307,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":3308,"benchmark_gaia":12,"benchmark_gsm8k":3309,"benchmark_humaneval":3310,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3311,"benchmark_mbppplus":3312,"benchmark_medqa":3313,"benchmark_mmlu":3314,"benchmark_mmmu":3315,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":3079,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":916,"benchmark_intelligence":1986},"19142987-e968-4163-9fd0-3e4c96637507","QwQ 32B-Preview",46.731,0.308,45.300000000000004,{"aa_id":3323,"ppt_model_id":3324,"slug":928,"model_name":929,"provider_name":730,"name":929,"provider":730,"aa_name":929,"is_open":11,"author_country":2653,"release_date":931,"release_month":913,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":3299,"benchmark_aime_25":12,"benchmark_gpqa":933,"benchmark_hle":3325,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":3326,"benchmark_math_hard":935,"benchmark_mmlu_pro":932,"benchmark_scicode":3327,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1986},"21ad274d-2ac9-4abd-98c7-b7cde217033e","98f74611-a319-44e2-979a-6e3c524c647f",7.9,27.500000000000004,22.6,{"aa_id":3329,"ppt_model_id":3330,"slug":939,"model_name":940,"provider_name":730,"name":940,"provider":730,"aa_name":940,"is_open":11,"author_country":2653,"release_date":942,"release_month":913,"context_length":129,"inference_mode":2654,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":615,"input_price":78,"output_price":615,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":944,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":943,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2720},"f2a70277-f1bd-45e9-8965-31f0f979f7b3","98f11bcf-8ac5-4beb-bf27-6c992e13033e",{"aa_id":3332,"ppt_model_id":3333,"slug":953,"model_name":954,"provider_name":248,"name":954,"provider":248,"aa_name":3334,"is_open":37,"author_country":2653,"release_date":956,"release_month":913,"context_length":129,"inference_mode":2654,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":957,"input_price":251,"output_price":957,"tokens_per_second":3335,"time_to_first_token":3336,"benchmark_aime":963,"benchmark_aime_25":3337,"benchmark_gpqa":959,"benchmark_hle":3012,"benchmark_ifbench":2349,"benchmark_lcr":230,"benchmark_livecodebench":3338,"benchmark_math_hard":962,"benchmark_mmlu_pro":958,"benchmark_scicode":1023,"benchmark_tau2":2322,"benchmark_terminalbench":2934,"benchmark_accountingaudit":2765,"benchmark_agieval_zh":3339,"benchmark_agieval_en":3340,"benchmark_arc_challenge":3341,"benchmark_arc_easy":3342,"benchmark_bbeh":12,"benchmark_bbh":3343,"benchmark_bfcl_v3":12,"benchmark_bird_critic":3344,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3345,"benchmark_ifeval":2993,"benchmark_knights_and_knaves":3346,"benchmark_math":3347,"benchmark_mbppplus":3348,"benchmark_medqa":3349,"benchmark_mmlu":12,"benchmark_mmmu":3350,"benchmark_multichallenge":12,"benchmark_simpleqa":3351,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":960,"benchmark_intelligence":3029,"benchmark_coding":211},"49d3c1a9-9c6c-4eec-9c11-d430a434e49a","ab811b00-eb92-46b5-ad1d-90923515188e","Gemma 3 27B Instruct",30.194,1.344,20.7,13.700000000000001,60.3381,65.1218,90.9556,98.2323,76.6088,25.7525,85.3659,57.5714,84.92,59.7884,67.4784,53.8889,8.4659,{"aa_id":3353,"ppt_model_id":3354,"slug":966,"model_name":967,"provider_name":3355,"name":967,"provider":3355,"aa_name":967,"is_open":11,"author_country":12,"release_date":970,"release_month":913,"context_length":181,"inference_mode":2654,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":377,"input_price":495,"output_price":377,"tokens_per_second":3356,"time_to_first_token":3357,"benchmark_aime":974,"benchmark_aime_25":917,"benchmark_gpqa":3358,"benchmark_hle":2719,"benchmark_ifbench":2860,"benchmark_lcr":2667,"benchmark_livecodebench":972,"benchmark_math_hard":973,"benchmark_mmlu_pro":958,"benchmark_scicode":2779,"benchmark_tau2":2667,"benchmark_terminalbench":2667,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":917,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1555,"benchmark_coding":1110},"10de79e2-2134-4487-bc03-08e5952a1a9f","f2514c14-b66c-4cae-a25e-80ce678f70fc","Reka AI",88.77,1.26,52.900000000000006,{"aa_id":3360,"ppt_model_id":3361,"slug":977,"model_name":978,"provider_name":385,"name":978,"provider":385,"aa_name":978,"is_open":37,"author_country":3362,"release_date":980,"release_month":913,"context_length":981,"inference_mode":2654,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":156,"input_price":220,"output_price":156,"tokens_per_second":3363,"time_to_first_token":3364,"benchmark_aime":3014,"benchmark_aime_25":880,"benchmark_gpqa":133,"benchmark_hle":2776,"benchmark_ifbench":1644,"benchmark_lcr":3090,"benchmark_livecodebench":983,"benchmark_math_hard":3365,"benchmark_mmlu_pro":982,"benchmark_scicode":3366,"benchmark_tau2":1986,"benchmark_terminalbench":524,"benchmark_accountingaudit":1188,"benchmark_agieval_zh":3367,"benchmark_agieval_en":3368,"benchmark_arc_challenge":3369,"benchmark_arc_easy":2986,"benchmark_bbeh":3370,"benchmark_bbh":3371,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":1208,"benchmark_gaia":12,"benchmark_gsm8k":3372,"benchmark_humaneval":3373,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3374,"benchmark_math":3375,"benchmark_mbppplus":3376,"benchmark_medqa":3377,"benchmark_mmlu":3378,"benchmark_mmmu":3379,"benchmark_multichallenge":12,"benchmark_simpleqa":3380,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":3381,"benchmark_wmt":12,"benchmark_aider":558,"benchmark_intelligence":3005,"benchmark_coding":2677},"b0544174-3e2f-4999-85f4-099a13710654","f2ed2885-83ef-4c98-9b50-846e93e25baf","ca",37.629,0.486,81.89999999999999,28.1,73.6419,70.1493,93.686,17.0638,79.573,94.6171,82.9268,39.1429,77.16,53.1746,73.2914,84.055,37.8889,15.8223,69.5581,{"aa_id":3383,"ppt_model_id":3384,"slug":988,"model_name":989,"provider_name":248,"name":989,"provider":248,"aa_name":3385,"is_open":37,"author_country":2653,"release_date":991,"release_month":913,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":208,"output_price_per_1m_tokens":808,"input_price":208,"output_price":808,"tokens_per_second":3386,"time_to_first_token":3387,"benchmark_aime":995,"benchmark_aime_25":3388,"benchmark_gpqa":993,"benchmark_hle":3280,"benchmark_ifbench":1686,"benchmark_lcr":429,"benchmark_livecodebench":3338,"benchmark_math_hard":994,"benchmark_mmlu_pro":992,"benchmark_scicode":1191,"benchmark_tau2":2900,"benchmark_terminalbench":524,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3388,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3389,"benchmark_coding":1004},"538dd80b-7d02-473c-9c08-82a0f0dd4f54","bd0757d3-514c-44f1-94d3-4b7072fc9d88","Gemma 3 12B Instruct",30.836,14.17,18.3,8.8,{"aa_id":3391,"ppt_model_id":3392,"slug":998,"model_name":999,"provider_name":248,"name":999,"provider":248,"aa_name":3393,"is_open":37,"author_country":2653,"release_date":1001,"release_month":913,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":208,"output_price_per_1m_tokens":251,"input_price":208,"output_price":251,"tokens_per_second":3394,"time_to_first_token":3395,"benchmark_aime":1004,"benchmark_aime_25":3046,"benchmark_gpqa":2692,"benchmark_hle":2835,"benchmark_ifbench":3212,"benchmark_lcr":230,"benchmark_livecodebench":2862,"benchmark_math_hard":1003,"benchmark_mmlu_pro":2933,"benchmark_scicode":3148,"benchmark_tau2":505,"benchmark_terminalbench":524,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3046,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1004,"benchmark_coding":3396},"3bd370fb-6689-46b9-a110-27941ba34fe4","2a804eb1-bcce-4ba1-b9ea-5b62f420c17c","Gemma 3 4B Instruct",33.323,1.092,2.9,{"aa_id":3398,"ppt_model_id":3399,"slug":1007,"model_name":1008,"provider_name":3400,"name":1008,"provider":3400,"aa_name":3401,"is_open":37,"author_country":2653,"release_date":1011,"release_month":913,"context_length":129,"inference_mode":2654,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":377,"input_price":299,"output_price":377,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":2691,"benchmark_gpqa":3402,"benchmark_hle":3403,"benchmark_ifbench":514,"benchmark_lcr":2667,"benchmark_livecodebench":2753,"benchmark_math_hard":12,"benchmark_mmlu_pro":1012,"benchmark_scicode":615,"benchmark_tau2":2667,"benchmark_terminalbench":2667,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":529,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2812,"benchmark_coding":3404},"d16d409d-40e2-4dcb-8428-1be9e8aaf9ad","4e2589da-61c6-46f4-a08a-a68c6fb7a4e1","Allen Institute for AI","OLMo 2 32B",32.800000000000004,3.6999999999999997,2.7,{"aa_id":3406,"ppt_model_id":3407,"slug":1017,"model_name":1018,"provider_name":2665,"name":1018,"provider":2665,"aa_name":3408,"is_open":37,"author_country":2666,"release_date":1020,"release_month":913,"context_length":129,"inference_mode":2654,"input_price_per_1m_tokens":207,"output_price_per_1m_tokens":86,"input_price":207,"output_price":86,"tokens_per_second":3409,"time_to_first_token":3410,"benchmark_aime":450,"benchmark_aime_25":3403,"benchmark_gpqa":1022,"benchmark_hle":3280,"benchmark_ifbench":121,"benchmark_lcr":2295,"benchmark_livecodebench":1023,"benchmark_math_hard":1024,"benchmark_mmlu_pro":1021,"benchmark_scicode":3411,"benchmark_tau2":3412,"benchmark_terminalbench":3413,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3414,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2768,"benchmark_coding":3415},"e291bb26-d16f-4380-971a-11d1901b275f","598628c8-8462-465e-b26f-8f7296280493","Mistral Small 3.1",154.584,0.483,26.5,25.1,7.6,3.7,13.9,{"aa_id":3417,"ppt_model_id":3418,"slug":1027,"model_name":1028,"provider_name":9,"name":1028,"provider":9,"aa_name":1028,"is_open":11,"author_country":2653,"release_date":1030,"release_month":913,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":1031,"output_price_per_1m_tokens":1032,"input_price":1031,"output_price":1032,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3419},"7c9944bd-655d-4054-a099-7e2693df521e","8cd3a60e-3231-4c91-92e0-51c97bda597c",25.8,{"aa_id":3421,"ppt_model_id":3422,"slug":1035,"model_name":1036,"provider_name":3115,"name":1036,"provider":3115,"aa_name":1036,"is_open":37,"author_country":2817,"release_date":1038,"release_month":913,"context_length":670,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":1039,"input_price":377,"output_price":1039,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":3423,"benchmark_aime_25":810,"benchmark_gpqa":1342,"benchmark_hle":2835,"benchmark_ifbench":810,"benchmark_lcr":810,"benchmark_livecodebench":209,"benchmark_math_hard":3424,"benchmark_mmlu_pro":3365,"benchmark_scicode":614,"benchmark_tau2":3052,"benchmark_terminalbench":1986,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1254,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1041,"benchmark_intelligence":1210,"benchmark_coding":3425},"749ee6fd-7ce9-4f93-9057-b994a8793e00","5b342e92-5b32-4202-925d-8946c0c00075",52,94.19999999999999,16.4,{"aa_id":3427,"ppt_model_id":3422,"slug":1035,"model_name":1036,"provider_name":3115,"name":1036,"provider":3115,"aa_name":3428,"is_open":37,"author_country":2817,"release_date":1038,"release_month":913,"context_length":670,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":1039,"input_price":377,"output_price":1039,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":963,"benchmark_aime_25":1254,"benchmark_gpqa":915,"benchmark_hle":2943,"benchmark_ifbench":3429,"benchmark_lcr":3299,"benchmark_livecodebench":784,"benchmark_math_hard":1042,"benchmark_mmlu_pro":1040,"benchmark_scicode":3430,"benchmark_tau2":229,"benchmark_terminalbench":2753,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1254,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1041,"benchmark_intelligence":1210,"benchmark_coding":3425},"cdaeb06f-0209-48f0-9d87-06cc9913bc62","DeepSeek V3 (Dec '24)",34.8,35.4,{"aa_id":3432,"ppt_model_id":3433,"slug":1045,"model_name":1046,"provider_name":1833,"name":1046,"provider":1833,"aa_name":3434,"is_open":37,"author_country":2817,"release_date":1048,"release_month":913,"context_length":129,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":274,"input_price":377,"output_price":274,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":448,"benchmark_aime_25":12,"benchmark_gpqa":1049,"benchmark_hle":2934,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":1050,"benchmark_math_hard":812,"benchmark_mmlu_pro":2974,"benchmark_scicode":2745,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1242},"6dce7b0e-ac2d-477e-92ac-c4d1f12bcd75","56e501f9-1f82-4c52-845a-ac781801338a","Qwen2.5 Instruct 32B",{"aa_id":3436,"ppt_model_id":3437,"slug":1053,"model_name":1054,"provider_name":2706,"name":1054,"provider":2706,"aa_name":1054,"is_open":37,"author_country":2653,"release_date":1056,"release_month":1057,"context_length":1058,"inference_mode":2654,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":50,"input_price":251,"output_price":50,"tokens_per_second":3438,"time_to_first_token":3439,"benchmark_aime":3212,"benchmark_aime_25":2820,"benchmark_gpqa":3199,"benchmark_hle":2787,"benchmark_ifbench":2461,"benchmark_lcr":3419,"benchmark_livecodebench":121,"benchmark_math_hard":3119,"benchmark_mmlu_pro":1040,"benchmark_scicode":2098,"benchmark_tau2":3151,"benchmark_terminalbench":26,"benchmark_accountingaudit":1188,"benchmark_agieval_zh":12,"benchmark_agieval_en":3440,"benchmark_arc_challenge":3441,"benchmark_arc_easy":3179,"benchmark_bbeh":3442,"benchmark_bbh":3443,"benchmark_bfcl_v3":3444,"benchmark_bird_critic":12,"benchmark_darkbench":3445,"benchmark_formal_logic_exp":495,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3446,"benchmark_ifeval":3447,"benchmark_knights_and_knaves":3448,"benchmark_math":3449,"benchmark_mbppplus":2953,"benchmark_medqa":3450,"benchmark_mmlu":3451,"benchmark_mmmu":3452,"benchmark_multichallenge":12,"benchmark_simpleqa":3453,"benchmark_stock_bcs":2667,"benchmark_swe_bench_lite":69,"benchmark_wmdp":12,"benchmark_wmt":3454,"benchmark_intelligence":3005,"benchmark_coding":429},"61e1d147-56c0-44af-b21e-54853bf84000","f97674be-ce8a-49ec-a595-850219c04756",132.223,0.453,27.4479,93.942,19.4912,79.3294,55.6857,47.7273,81.0976,83.9187,30.7143,80.04,52.0031,24.5849,42.3333,7.3047,37.0825,{"aa_id":3456,"ppt_model_id":3457,"slug":1062,"model_name":1063,"provider_name":2706,"name":1063,"provider":2706,"aa_name":1063,"is_open":37,"author_country":2653,"release_date":1065,"release_month":1057,"context_length":856,"inference_mode":2654,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":274,"input_price":273,"output_price":274,"tokens_per_second":3458,"time_to_first_token":3459,"benchmark_aime":1071,"benchmark_aime_25":3460,"benchmark_gpqa":3236,"benchmark_hle":3280,"benchmark_ifbench":1124,"benchmark_lcr":3461,"benchmark_livecodebench":1069,"benchmark_math_hard":1070,"benchmark_mmlu_pro":1066,"benchmark_scicode":2733,"benchmark_tau2":132,"benchmark_terminalbench":2753,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":12,"benchmark_agieval_en":3462,"benchmark_arc_challenge":3463,"benchmark_arc_easy":3179,"benchmark_bbeh":3464,"benchmark_bbh":3465,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":2900,"benchmark_gaia":12,"benchmark_gsm8k":3182,"benchmark_humaneval":3466,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3467,"benchmark_math":3468,"benchmark_mbppplus":3469,"benchmark_medqa":3470,"benchmark_mmlu":3471,"benchmark_mmmu":3472,"benchmark_multichallenge":12,"benchmark_simpleqa":3473,"benchmark_stock_bcs":2667,"benchmark_swe_bench_lite":615,"benchmark_wmdp":12,"benchmark_wmt":3474,"benchmark_aider":1068,"benchmark_intelligence":3475,"benchmark_coding":1068},"d4f9e20b-30e2-42b5-b696-9a4179b68bf6","31f657d9-fcdf-4ab1-b895-a3c8fe06b863",124.182,0.557,19.3,46,76.6693,94.9659,25.6221,81.8154,84.7561,59.4286,86.8289,60.0529,78.3975,85.5434,31.3333,22.1452,37.9787,18.4,{"aa_id":12,"ppt_model_id":3477,"slug":1074,"model_name":1075,"provider_name":1076,"name":1075,"provider":1076,"aa_name":12,"is_open":11,"author_country":2653,"release_date":1078,"release_month":1057,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":3478,"benchmark_agieval_zh":3479,"benchmark_agieval_en":3480,"benchmark_arc_challenge":3369,"benchmark_arc_easy":3481,"benchmark_bbeh":12,"benchmark_bbh":3482,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":2294,"benchmark_gaia":12,"benchmark_gsm8k":3483,"benchmark_humaneval":3484,"benchmark_ifeval":12,"benchmark_knights_and_knaves":1158,"benchmark_math":3485,"benchmark_mbppplus":3486,"benchmark_medqa":3487,"benchmark_mmlu":12,"benchmark_mmmu":3488,"benchmark_multichallenge":12,"benchmark_simpleqa":3489,"benchmark_stock_bcs":497,"benchmark_swe_bench_lite":12,"benchmark_wmdp":3490,"benchmark_wmt":12,"benchmark_aider":1079},"94d6d3ca-0fc8-4b1c-b5a5-6638819820ef",73.3333,71.4246,71.2883,99.032,53.8473,93.1193,91.4634,92.0039,58.4656,86.0958,49.1111,38.3033,74.3457,{"aa_id":12,"ppt_model_id":3492,"slug":1082,"model_name":1083,"provider_name":1076,"name":1083,"provider":1076,"aa_name":12,"is_open":11,"author_country":2653,"release_date":1085,"release_month":1057,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":25,"input_price":50,"output_price":25,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":3493,"benchmark_agieval_en":12,"benchmark_arc_challenge":3494,"benchmark_arc_easy":3495,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3496,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":3224,"benchmark_medqa":12,"benchmark_mmlu":3497,"benchmark_mmmu":3498,"benchmark_multichallenge":12,"benchmark_simpleqa":3499,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1086},"28b13def-723b-44d3-a9c9-a8addc41e218",77.3559,95.2218,98.8636,95.7317,89.154,52.4444,18.4004,{"aa_id":3501,"ppt_model_id":3502,"slug":1103,"model_name":1104,"provider_name":9,"name":1104,"provider":9,"aa_name":3503,"is_open":11,"author_country":2653,"release_date":1106,"release_month":1057,"context_length":1107,"inference_mode":2654,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":377,"input_price":299,"output_price":377,"tokens_per_second":3504,"time_to_first_token":3505,"benchmark_aime":1113,"benchmark_aime_25":3506,"benchmark_gpqa":1109,"benchmark_hle":1875,"benchmark_ifbench":3507,"benchmark_lcr":2098,"benchmark_livecodebench":1111,"benchmark_math_hard":1112,"benchmark_mmlu_pro":1108,"benchmark_scicode":2788,"benchmark_tau2":2775,"benchmark_terminalbench":2934,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3506,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1110,"benchmark_intelligence":880,"benchmark_coding":1002},"0ddc315a-6a81-4ebb-853f-44dc4051e114","3451226e-b595-4158-a36c-e524bee5224b","GPT-4.1 nano",140.559,0.404,24,32,{"aa_id":3509,"ppt_model_id":3510,"slug":1116,"model_name":1117,"provider_name":9,"name":1117,"provider":9,"aa_name":3511,"is_open":11,"author_country":2653,"release_date":1119,"release_month":1057,"context_length":1107,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":524,"input_price":377,"output_price":524,"tokens_per_second":3512,"time_to_first_token":3513,"benchmark_aime":1124,"benchmark_aime_25":3514,"benchmark_gpqa":1121,"benchmark_hle":2776,"benchmark_ifbench":388,"benchmark_lcr":3515,"benchmark_livecodebench":201,"benchmark_math_hard":1123,"benchmark_mmlu_pro":3516,"benchmark_scicode":3517,"benchmark_tau2":3358,"benchmark_terminalbench":3413,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3518,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1122,"benchmark_intelligence":3519,"benchmark_coding":904},"2f55cded-9d13-4b9d-9ed0-f7e4055002f4","377f9d36-d123-48fc-8eda-1771e733612d","GPT-4.1 mini",67.202,0.531,46.300000000000004,42.3,78.10000000000001,40.400000000000006,46.3,22.9,{"aa_id":3521,"ppt_model_id":3522,"slug":1127,"model_name":1128,"provider_name":9,"name":1128,"provider":9,"aa_name":1128,"is_open":11,"author_country":2653,"release_date":1130,"release_month":1057,"context_length":1107,"inference_mode":2654,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":615,"input_price":78,"output_price":615,"tokens_per_second":3523,"time_to_first_token":3524,"benchmark_aime":1136,"benchmark_aime_25":2837,"benchmark_gpqa":3525,"benchmark_hle":2776,"benchmark_ifbench":1124,"benchmark_lcr":1786,"benchmark_livecodebench":1134,"benchmark_math_hard":1135,"benchmark_mmlu_pro":3526,"benchmark_scicode":514,"benchmark_tau2":3052,"benchmark_terminalbench":3527,"benchmark_accountingaudit":3190,"benchmark_agieval_zh":3528,"benchmark_agieval_en":3529,"benchmark_arc_challenge":3530,"benchmark_arc_easy":3481,"benchmark_bbeh":3531,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":3532,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3533,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3534,"benchmark_math":425,"benchmark_mbppplus":3535,"benchmark_medqa":3536,"benchmark_mmlu":3537,"benchmark_mmmu":3538,"benchmark_multichallenge":12,"benchmark_simpleqa":3539,"benchmark_stock_bcs":3136,"benchmark_swe_bench_lite":12,"benchmark_wmdp":3540,"benchmark_wmt":3541,"benchmark_aider":1133,"benchmark_intelligence":1610,"benchmark_coding":783},"13c6f2c7-09d5-42a5-af53-b7c93ed11245","86211b9b-e2a7-4807-9d9c-97efc6e847d5",86.313,0.602,66.60000000000001,80.60000000000001,13.600000000000001,69.2905,70.0314,95.1365,17.6549,90.6,93.2927,77.1429,62.963,89.7093,84.5962,69.3333,40.4375,71.374,37.5762,{"aa_id":3543,"ppt_model_id":3544,"slug":1139,"model_name":1140,"provider_name":1833,"name":1140,"provider":1833,"aa_name":3545,"is_open":37,"author_country":2817,"release_date":1142,"release_month":1057,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":207,"output_price_per_1m_tokens":404,"input_price":207,"output_price":404,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":1146,"benchmark_aime_25":12,"benchmark_gpqa":3546,"benchmark_hle":3280,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":1144,"benchmark_math_hard":1145,"benchmark_mmlu_pro":892,"benchmark_scicode":2700,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":156},"41a5b11c-6ea8-455c-a923-63f1fc3db15d","dbef3256-4bd8-434c-9bed-61c9bfe0c5b5","Qwen2.5 Coder Instruct 7B ",33.900000000000006,{"aa_id":3548,"ppt_model_id":3549,"slug":1149,"model_name":1150,"provider_name":9,"name":1150,"provider":9,"aa_name":3550,"is_open":11,"author_country":2653,"release_date":1152,"release_month":1057,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":708,"output_price_per_1m_tokens":1153,"input_price":708,"output_price":1153,"tokens_per_second":3551,"time_to_first_token":3552,"benchmark_aime":1158,"benchmark_aime_25":1323,"benchmark_gpqa":1155,"benchmark_hle":3039,"benchmark_ifbench":749,"benchmark_lcr":3553,"benchmark_livecodebench":1156,"benchmark_math_hard":1157,"benchmark_mmlu_pro":1154,"benchmark_scicode":484,"benchmark_tau2":3554,"benchmark_terminalbench":1986,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1323,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":412,"benchmark_intelligence":2733,"benchmark_coding":3555},"6061e1ad-5631-4872-b856-171bd8c2b8b2","40b3d6fc-ac45-4e8c-b17b-67ba28f34a81","o4-mini (high)",128.562,21.715,55.00000000000001,55.60000000000001,25.6,{"aa_id":3557,"ppt_model_id":3558,"slug":1161,"model_name":1162,"provider_name":9,"name":1162,"provider":9,"aa_name":1162,"is_open":11,"author_country":2653,"release_date":1164,"release_month":1057,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":615,"input_price":78,"output_price":615,"tokens_per_second":3559,"time_to_first_token":3560,"benchmark_aime":1169,"benchmark_aime_25":962,"benchmark_gpqa":3561,"benchmark_hle":436,"benchmark_ifbench":2945,"benchmark_lcr":1528,"benchmark_livecodebench":3562,"benchmark_math_hard":1168,"benchmark_mmlu_pro":994,"benchmark_scicode":810,"benchmark_tau2":1208,"benchmark_terminalbench":2022,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":3563,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3564,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":962,"benchmark_mbppplus":3565,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1166,"benchmark_intelligence":3566,"benchmark_coding":3566},"824d8ef1-9b1b-45bd-b88c-7188de7758aa","d58ef503-cd4d-4f92-b991-f863fdc9640d",86.478,7.348,82.69999999999999,80.80000000000001,90.8877,89.5561,61.6402,38.4,{"aa_id":12,"ppt_model_id":3568,"slug":1172,"model_name":1173,"provider_name":9,"name":1173,"provider":9,"aa_name":12,"is_open":11,"author_country":2653,"release_date":1175,"release_month":1057,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":700,"output_price_per_1m_tokens":765,"input_price":700,"output_price":765,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":12,"benchmark_agieval_en":3569,"benchmark_arc_challenge":3530,"benchmark_arc_easy":3096,"benchmark_bbeh":12,"benchmark_bbh":3570,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":3571,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3572,"benchmark_humaneval":3573,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3574,"benchmark_math":3575,"benchmark_mbppplus":3576,"benchmark_medqa":3577,"benchmark_mmlu":12,"benchmark_mmmu":3578,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":497,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12},"643c7666-865e-4d6d-880f-89d4cf579572",87.7703,82.0125,42.7921,95.9726,96.3415,99.6795,94.5741,64.2857,95.1817,79.156,{"aa_id":3580,"ppt_model_id":3581,"slug":1178,"model_name":3582,"provider_name":1833,"name":1179,"provider":1833,"aa_name":3582,"is_open":37,"author_country":2817,"release_date":1181,"release_month":1057,"context_length":287,"inference_mode":3250,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":524,"input_price":536,"output_price":524,"tokens_per_second":3583,"time_to_first_token":3584,"benchmark_aime":1190,"benchmark_aime_25":1192,"benchmark_gpqa":1188,"benchmark_hle":2729,"benchmark_ifbench":118,"benchmark_lcr":2667,"benchmark_livecodebench":1189,"benchmark_math_hard":860,"benchmark_mmlu_pro":1187,"benchmark_scicode":3176,"benchmark_tau2":3506,"benchmark_terminalbench":2975,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":3585,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3586,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3587,"benchmark_humaneval":3588,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1113,"benchmark_mbppplus":3589,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3590,"benchmark_stock_bcs":3190,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1183,"benchmark_livecodebench_reasoning":1189,"benchmark_mmlu_pro_reasoning":1187,"benchmark_gpqa_reasoning":1188,"benchmark_math_hard_reasoning":860,"benchmark_aime_reasoning":1190,"benchmark_aime_25_reasoning":1192,"benchmark_hle_reasoning":280,"benchmark_scicode_reasoning":2164,"benchmark_ifbench_reasoning":118,"benchmark_lcr_reasoning":2667,"benchmark_terminalbench_reasoning":2975,"benchmark_tau2_reasoning":3506,"benchmark_intelligence":2098,"benchmark_coding":439,"benchmark_intelligence_reasoning":200,"benchmark_coding_reasoning":1191,"benchmark_math_reasoning":1192},"dc235cf5-abbe-48f5-86f1-4f6b4912209e","6e0bfad3-751a-4392-87e1-17f2ceb51aea","Qwen3 235B A22B (Reasoning)",51.381,1.174,89.3729,84.2211,95.1613,90.2439,66.1677,12.7197,{"aa_id":3592,"ppt_model_id":3581,"slug":1178,"model_name":1179,"provider_name":1833,"name":1179,"provider":1833,"aa_name":3593,"is_open":37,"author_country":2817,"release_date":1181,"release_month":1057,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":524,"input_price":536,"output_price":524,"tokens_per_second":3594,"time_to_first_token":3595,"benchmark_aime":1186,"benchmark_aime_25":1113,"benchmark_gpqa":1182,"benchmark_hle":3012,"benchmark_ifbench":2906,"benchmark_lcr":2667,"benchmark_livecodebench":3596,"benchmark_math_hard":1185,"benchmark_mmlu_pro":781,"benchmark_scicode":121,"benchmark_tau2":3597,"benchmark_terminalbench":2975,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":3585,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3586,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3587,"benchmark_humaneval":3588,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1113,"benchmark_mbppplus":3589,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3590,"benchmark_stock_bcs":3190,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1183,"benchmark_livecodebench_reasoning":1189,"benchmark_mmlu_pro_reasoning":1187,"benchmark_gpqa_reasoning":1188,"benchmark_math_hard_reasoning":860,"benchmark_aime_reasoning":1190,"benchmark_aime_25_reasoning":1192,"benchmark_hle_reasoning":280,"benchmark_scicode_reasoning":2164,"benchmark_ifbench_reasoning":118,"benchmark_lcr_reasoning":2667,"benchmark_terminalbench_reasoning":2975,"benchmark_tau2_reasoning":3506,"benchmark_intelligence":2098,"benchmark_coding":439,"benchmark_intelligence_reasoning":200,"benchmark_coding_reasoning":1191,"benchmark_math_reasoning":1192},"d4b339c6-2709-4e62-a440-bc39903208ef","Qwen3 235B A22B (Non-reasoning)",49.818,1.118,34.300000000000004,27.200000000000003,{"aa_id":3599,"ppt_model_id":3600,"slug":1195,"model_name":3601,"provider_name":1833,"name":1196,"provider":1833,"aa_name":3601,"is_open":37,"author_country":2817,"release_date":1198,"release_month":1057,"context_length":1199,"inference_mode":3250,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":622,"input_price":251,"output_price":622,"tokens_per_second":3602,"time_to_first_token":3603,"benchmark_aime":1208,"benchmark_aime_25":1211,"benchmark_gpqa":1205,"benchmark_hle":427,"benchmark_ifbench":2383,"benchmark_lcr":2667,"benchmark_livecodebench":1206,"benchmark_math_hard":1207,"benchmark_mmlu_pro":3604,"benchmark_scicode":3430,"benchmark_tau2":3605,"benchmark_terminalbench":68,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":3606,"benchmark_agieval_en":12,"benchmark_arc_challenge":3257,"benchmark_arc_easy":3607,"benchmark_bbeh":12,"benchmark_bbh":3608,"benchmark_bfcl_v3":3609,"benchmark_bird_critic":12,"benchmark_darkbench":3610,"benchmark_formal_logic_exp":12,"benchmark_gaia":3611,"benchmark_gsm8k":3612,"benchmark_humaneval":3496,"benchmark_ifeval":3613,"benchmark_knights_and_knaves":12,"benchmark_math":2295,"benchmark_mbppplus":3614,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":3615,"benchmark_multichallenge":12,"benchmark_simpleqa":3616,"benchmark_stock_bcs":1351,"benchmark_swe_bench_lite":3617,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1201,"benchmark_livecodebench_reasoning":1206,"benchmark_mmlu_pro_reasoning":1204,"benchmark_gpqa_reasoning":1205,"benchmark_math_hard_reasoning":1207,"benchmark_aime_reasoning":1208,"benchmark_aime_25_reasoning":1211,"benchmark_hle_reasoning":427,"benchmark_scicode_reasoning":3430,"benchmark_ifbench_reasoning":2383,"benchmark_lcr_reasoning":2667,"benchmark_terminalbench_reasoning":68,"benchmark_tau2_reasoning":3618,"benchmark_intelligence":2768,"benchmark_intelligence_reasoning":1210,"benchmark_coding_reasoning":1209,"benchmark_math_reasoning":1211},"86822b45-0946-4fae-9240-461e90314d51","093ea70c-01f1-43df-9c9f-037e45e7ec5d","Qwen3 32B (Reasoning)",108.702,0.96,79.80000000000001,29.799999999999997,86.748,99.1162,85.824,75.6812,49.2424,12.3288,94.5578,81.3309,63.3803,52.0717,5.4785,16.3333,29.8,{"aa_id":3620,"ppt_model_id":3600,"slug":1195,"model_name":1196,"provider_name":1833,"name":1196,"provider":1833,"aa_name":3621,"is_open":37,"author_country":2817,"release_date":1198,"release_month":1057,"context_length":1199,"inference_mode":2654,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":622,"input_price":251,"output_price":622,"tokens_per_second":3622,"time_to_first_token":3623,"benchmark_aime":1203,"benchmark_aime_25":2295,"benchmark_gpqa":903,"benchmark_hle":2787,"benchmark_ifbench":3624,"benchmark_lcr":2667,"benchmark_livecodebench":3053,"benchmark_math_hard":1202,"benchmark_mmlu_pro":1200,"benchmark_scicode":3625,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":3606,"benchmark_agieval_en":12,"benchmark_arc_challenge":3257,"benchmark_arc_easy":3607,"benchmark_bbeh":12,"benchmark_bbh":3608,"benchmark_bfcl_v3":3609,"benchmark_bird_critic":12,"benchmark_darkbench":3610,"benchmark_formal_logic_exp":12,"benchmark_gaia":3611,"benchmark_gsm8k":3612,"benchmark_humaneval":3496,"benchmark_ifeval":3613,"benchmark_knights_and_knaves":12,"benchmark_math":2295,"benchmark_mbppplus":3614,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":3615,"benchmark_multichallenge":12,"benchmark_simpleqa":3616,"benchmark_stock_bcs":1351,"benchmark_swe_bench_lite":3617,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1201,"benchmark_livecodebench_reasoning":1206,"benchmark_mmlu_pro_reasoning":1204,"benchmark_gpqa_reasoning":1205,"benchmark_math_hard_reasoning":1207,"benchmark_aime_reasoning":1208,"benchmark_aime_25_reasoning":1211,"benchmark_hle_reasoning":427,"benchmark_scicode_reasoning":3430,"benchmark_ifbench_reasoning":2383,"benchmark_lcr_reasoning":2667,"benchmark_terminalbench_reasoning":68,"benchmark_tau2_reasoning":3618,"benchmark_intelligence":2768,"benchmark_intelligence_reasoning":1210,"benchmark_coding_reasoning":1209,"benchmark_math_reasoning":1211},"f0f8ee02-5b18-4b09-a743-7c2a31a20c04","Qwen3 32B (Non-reasoning)",107.959,0.966,31.5,28.000000000000004,{"aa_id":3627,"ppt_model_id":3628,"slug":1214,"model_name":3629,"provider_name":1833,"name":1215,"provider":1833,"aa_name":3629,"is_open":37,"author_country":2817,"release_date":1217,"release_month":1057,"context_length":1199,"inference_mode":3250,"input_price_per_1m_tokens":41,"output_price_per_1m_tokens":377,"input_price":41,"output_price":377,"tokens_per_second":3630,"time_to_first_token":3631,"benchmark_aime":1224,"benchmark_aime_25":915,"benchmark_gpqa":768,"benchmark_hle":2787,"benchmark_ifbench":209,"benchmark_lcr":2667,"benchmark_livecodebench":3118,"benchmark_math_hard":1207,"benchmark_mmlu_pro":1222,"benchmark_scicode":2964,"benchmark_tau2":2071,"benchmark_terminalbench":2934,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3632,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3633,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1223,"benchmark_mmlu_pro_reasoning":1222,"benchmark_gpqa_reasoning":768,"benchmark_math_hard_reasoning":1207,"benchmark_aime_reasoning":1224,"benchmark_aime_25_reasoning":915,"benchmark_hle_reasoning":2787,"benchmark_scicode_reasoning":2964,"benchmark_ifbench_reasoning":209,"benchmark_lcr_reasoning":2667,"benchmark_terminalbench_reasoning":2934,"benchmark_tau2_reasoning":2071,"benchmark_intelligence":2657,"benchmark_coding":3634,"benchmark_intelligence_reasoning":1226,"benchmark_coding_reasoning":1225,"benchmark_math_reasoning":915},"55f225fd-d44c-42eb-838b-bf09db8c220b","3754bb8c-7765-4275-9c3f-598a3e2f5bbc","Qwen3 14B (Reasoning)",64.787,0.998,84.6438,58,12.4,{"aa_id":3636,"ppt_model_id":3628,"slug":1214,"model_name":1215,"provider_name":1833,"name":1215,"provider":1833,"aa_name":3637,"is_open":37,"author_country":2817,"release_date":1217,"release_month":1057,"context_length":1199,"inference_mode":2654,"input_price_per_1m_tokens":41,"output_price_per_1m_tokens":377,"input_price":41,"output_price":377,"tokens_per_second":3638,"time_to_first_token":3639,"benchmark_aime":3625,"benchmark_aime_25":3640,"benchmark_gpqa":1219,"benchmark_hle":2752,"benchmark_ifbench":3641,"benchmark_lcr":2667,"benchmark_livecodebench":3625,"benchmark_math_hard":1221,"benchmark_mmlu_pro":1218,"benchmark_scicode":3411,"benchmark_tau2":1252,"benchmark_terminalbench":1146,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3632,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3633,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1223,"benchmark_mmlu_pro_reasoning":1222,"benchmark_gpqa_reasoning":768,"benchmark_math_hard_reasoning":1207,"benchmark_aime_reasoning":1224,"benchmark_aime_25_reasoning":915,"benchmark_hle_reasoning":2787,"benchmark_scicode_reasoning":2964,"benchmark_ifbench_reasoning":209,"benchmark_lcr_reasoning":2667,"benchmark_terminalbench_reasoning":2934,"benchmark_tau2_reasoning":2071,"benchmark_intelligence":2657,"benchmark_coding":3634,"benchmark_intelligence_reasoning":1226,"benchmark_coding_reasoning":1225,"benchmark_math_reasoning":915},"e2795fc2-f2d7-4e34-8287-a1df8e954d8b","Qwen3 14B (Non-reasoning)",65.764,1.036,57.99999999999999,23.9,{"aa_id":3643,"ppt_model_id":3644,"slug":1229,"model_name":3645,"provider_name":1833,"name":1230,"provider":1833,"aa_name":3645,"is_open":37,"author_country":2817,"release_date":1232,"release_month":1057,"context_length":1199,"inference_mode":3250,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":377,"input_price":299,"output_price":377,"tokens_per_second":3646,"time_to_first_token":3647,"benchmark_aime":653,"benchmark_aime_25":1243,"benchmark_gpqa":1238,"benchmark_hle":2752,"benchmark_ifbench":3648,"benchmark_lcr":2667,"benchmark_livecodebench":1239,"benchmark_math_hard":1240,"benchmark_mmlu_pro":1237,"benchmark_scicode":3327,"benchmark_tau2":3649,"benchmark_terminalbench":363,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1236,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1239,"benchmark_mmlu_pro_reasoning":1237,"benchmark_gpqa_reasoning":1238,"benchmark_math_hard_reasoning":1240,"benchmark_aime_reasoning":653,"benchmark_aime_25_reasoning":1243,"benchmark_hle_reasoning":2752,"benchmark_scicode_reasoning":3327,"benchmark_ifbench_reasoning":3648,"benchmark_lcr_reasoning":2667,"benchmark_terminalbench_reasoning":363,"benchmark_tau2_reasoning":3650,"benchmark_intelligence":2812,"benchmark_coding":3651,"benchmark_intelligence_reasoning":1242,"benchmark_coding_reasoning":1241,"benchmark_math_reasoning":1243},"e5981e0b-6809-411a-8362-ad2c2bf15235","3f88d51e-d6cf-49e8-84c6-052c017c9845","Qwen3 8B (Reasoning)",82.989,0.922,33.5,27.800000000000004,27.8,7.1,{"aa_id":3653,"ppt_model_id":3644,"slug":1229,"model_name":1230,"provider_name":1833,"name":1230,"provider":1833,"aa_name":3654,"is_open":37,"author_country":2817,"release_date":1232,"release_month":1057,"context_length":1199,"inference_mode":2654,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":377,"input_price":299,"output_price":377,"tokens_per_second":3655,"time_to_first_token":3656,"benchmark_aime":1236,"benchmark_aime_25":1236,"benchmark_gpqa":1234,"benchmark_hle":2669,"benchmark_ifbench":2789,"benchmark_lcr":2667,"benchmark_livecodebench":3657,"benchmark_math_hard":1187,"benchmark_mmlu_pro":1233,"benchmark_scicode":3658,"benchmark_tau2":3659,"benchmark_terminalbench":363,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1236,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1239,"benchmark_mmlu_pro_reasoning":1237,"benchmark_gpqa_reasoning":1238,"benchmark_math_hard_reasoning":1240,"benchmark_aime_reasoning":653,"benchmark_aime_25_reasoning":1243,"benchmark_hle_reasoning":2752,"benchmark_scicode_reasoning":3327,"benchmark_ifbench_reasoning":3648,"benchmark_lcr_reasoning":2667,"benchmark_terminalbench_reasoning":363,"benchmark_tau2_reasoning":3650,"benchmark_intelligence":2812,"benchmark_coding":3651,"benchmark_intelligence_reasoning":1242,"benchmark_coding_reasoning":1241,"benchmark_math_reasoning":1243},"ac12a937-7d1d-4034-a876-164005fd1661","Qwen3 8B (Non-reasoning)",94.149,0.92,20.200000000000003,16.8,24.9,{"aa_id":3661,"ppt_model_id":3662,"slug":1246,"model_name":3663,"provider_name":1833,"name":1247,"provider":1833,"aa_name":3663,"is_open":37,"author_country":2817,"release_date":1249,"release_month":1057,"context_length":1199,"inference_mode":3250,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":1250,"input_price":251,"output_price":1250,"tokens_per_second":587,"time_to_first_token":3664,"benchmark_aime":1259,"benchmark_aime_25":656,"benchmark_gpqa":1256,"benchmark_hle":2668,"benchmark_ifbench":3665,"benchmark_lcr":2667,"benchmark_livecodebench":1257,"benchmark_math_hard":3666,"benchmark_mmlu_pro":1255,"benchmark_scicode":3667,"benchmark_tau2":1254,"benchmark_terminalbench":363,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":3668,"benchmark_agieval_en":3669,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3670,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3671,"benchmark_humaneval":3533,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3672,"benchmark_mbppplus":3673,"benchmark_medqa":3674,"benchmark_mmlu":3675,"benchmark_mmmu":3676,"benchmark_multichallenge":12,"benchmark_simpleqa":3677,"benchmark_stock_bcs":3190,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1257,"benchmark_mmlu_pro_reasoning":1255,"benchmark_gpqa_reasoning":1256,"benchmark_math_hard_reasoning":1258,"benchmark_aime_reasoning":1259,"benchmark_aime_25_reasoning":656,"benchmark_hle_reasoning":120,"benchmark_scicode_reasoning":3678,"benchmark_ifbench_reasoning":3665,"benchmark_lcr_reasoning":2667,"benchmark_terminalbench_reasoning":363,"benchmark_tau2_reasoning":1254,"benchmark_intelligence":2094,"benchmark_coding":3679,"benchmark_intelligence_reasoning":1260,"benchmark_coding_reasoning":448,"benchmark_math_reasoning":656},"e1a843ea-dbd0-493f-aeab-47c1f4ab9b5b","125eee7e-5c10-4f90-b6bd-9d583e639d1c","Qwen3 30B A3B (Reasoning)",1.043,41.5,95.89999999999999,28.499999999999996,85.4767,83.0897,89.5254,94.1176,93.0046,62.6039,85.3103,85.2656,49,5.6403,28.5,13.3,{"aa_id":3681,"ppt_model_id":3662,"slug":1246,"model_name":1247,"provider_name":1833,"name":1247,"provider":1833,"aa_name":3682,"is_open":37,"author_country":2817,"release_date":1249,"release_month":1057,"context_length":1199,"inference_mode":2654,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":1250,"input_price":251,"output_price":1250,"tokens_per_second":3683,"time_to_first_token":3684,"benchmark_aime":1254,"benchmark_aime_25":3211,"benchmark_gpqa":130,"benchmark_hle":2776,"benchmark_ifbench":2694,"benchmark_lcr":2667,"benchmark_livecodebench":1252,"benchmark_math_hard":1253,"benchmark_mmlu_pro":1251,"benchmark_scicode":3167,"benchmark_tau2":1420,"benchmark_terminalbench":2753,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":3668,"benchmark_agieval_en":3669,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3670,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3671,"benchmark_humaneval":3533,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3672,"benchmark_mbppplus":3673,"benchmark_medqa":3674,"benchmark_mmlu":3675,"benchmark_mmmu":3676,"benchmark_multichallenge":12,"benchmark_simpleqa":3677,"benchmark_stock_bcs":3190,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1257,"benchmark_mmlu_pro_reasoning":1255,"benchmark_gpqa_reasoning":1256,"benchmark_math_hard_reasoning":1258,"benchmark_aime_reasoning":1259,"benchmark_aime_25_reasoning":656,"benchmark_hle_reasoning":120,"benchmark_scicode_reasoning":3678,"benchmark_ifbench_reasoning":3665,"benchmark_lcr_reasoning":2667,"benchmark_terminalbench_reasoning":363,"benchmark_tau2_reasoning":1254,"benchmark_intelligence":2094,"benchmark_coding":3679,"benchmark_intelligence_reasoning":1260,"benchmark_coding_reasoning":448,"benchmark_math_reasoning":656},"5d9049c5-693c-4566-9202-b6f8587fb917","Qwen3 30B A3B (Non-reasoning)",68.454,0.991,{"aa_id":3686,"ppt_model_id":3687,"slug":1263,"model_name":3688,"provider_name":1833,"name":1264,"provider":1833,"aa_name":3689,"is_open":37,"author_country":2817,"release_date":1266,"release_month":1057,"context_length":1199,"inference_mode":3250,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":317,"benchmark_aime_25":3561,"benchmark_gpqa":3690,"benchmark_hle":3691,"benchmark_ifbench":635,"benchmark_lcr":3692,"benchmark_livecodebench":1897,"benchmark_math_hard":1268,"benchmark_mmlu_pro":1237,"benchmark_scicode":3555,"benchmark_tau2":1511,"benchmark_terminalbench":26,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":484,"benchmark_mmlu_pro_reasoning":1269,"benchmark_gpqa_reasoning":1270,"benchmark_math_hard_reasoning":1271,"benchmark_aime_reasoning":1108,"benchmark_aime_25_reasoning":890,"benchmark_hle_reasoning":2719,"benchmark_scicode_reasoning":3693,"benchmark_ifbench_reasoning":1944,"benchmark_lcr_reasoning":2667,"benchmark_tau2_reasoning":1243,"benchmark_intelligence":2094,"benchmark_intelligence_reasoning":1272,"benchmark_math_reasoning":890},"1130b9ab-5e0b-4f39-8931-ebad4783816a","9f41bae3-5eaf-401e-8255-3d680bb18307","Qwen3 4B (Reasoning)","Qwen3 4B 2507 (Reasoning)",66.7,5.8999999999999995,37.7,3.5,{"aa_id":3695,"ppt_model_id":3687,"slug":1263,"model_name":3688,"provider_name":1833,"name":1264,"provider":1833,"aa_name":3688,"is_open":37,"author_country":2817,"release_date":1266,"release_month":1057,"context_length":1199,"inference_mode":3250,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"tokens_per_second":3696,"time_to_first_token":1828,"benchmark_aime":1108,"benchmark_aime_25":890,"benchmark_gpqa":1270,"benchmark_hle":2719,"benchmark_ifbench":1944,"benchmark_lcr":2667,"benchmark_livecodebench":484,"benchmark_math_hard":3697,"benchmark_mmlu_pro":1269,"benchmark_scicode":2912,"benchmark_tau2":1243,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":484,"benchmark_mmlu_pro_reasoning":1269,"benchmark_gpqa_reasoning":1270,"benchmark_math_hard_reasoning":1271,"benchmark_aime_reasoning":1108,"benchmark_aime_25_reasoning":890,"benchmark_hle_reasoning":2719,"benchmark_scicode_reasoning":3693,"benchmark_ifbench_reasoning":1944,"benchmark_lcr_reasoning":2667,"benchmark_tau2_reasoning":1243,"benchmark_intelligence":2094,"benchmark_intelligence_reasoning":1272,"benchmark_math_reasoning":890},"65e9ca6e-fcce-4ee7-9cdc-c172963c1594",102.857,93.30000000000001,{"aa_id":3699,"ppt_model_id":3687,"slug":1263,"model_name":1264,"provider_name":1833,"name":1264,"provider":1833,"aa_name":3700,"is_open":37,"author_country":2817,"release_date":1266,"release_month":1057,"context_length":1199,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":317,"benchmark_aime_25":3118,"benchmark_gpqa":3701,"benchmark_hle":3012,"benchmark_ifbench":3648,"benchmark_lcr":3148,"benchmark_livecodebench":3692,"benchmark_math_hard":1268,"benchmark_mmlu_pro":1661,"benchmark_scicode":3702,"benchmark_tau2":723,"benchmark_terminalbench":545,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":484,"benchmark_mmlu_pro_reasoning":1269,"benchmark_gpqa_reasoning":1270,"benchmark_math_hard_reasoning":1271,"benchmark_aime_reasoning":1108,"benchmark_aime_25_reasoning":890,"benchmark_hle_reasoning":2719,"benchmark_scicode_reasoning":3693,"benchmark_ifbench_reasoning":1944,"benchmark_lcr_reasoning":2667,"benchmark_tau2_reasoning":1243,"benchmark_intelligence":2094,"benchmark_intelligence_reasoning":1272,"benchmark_math_reasoning":890},"37210287-496c-402a-b583-00094b7a9532","Qwen3 4B 2507 Instruct",51.7,18.099999999999998,{"aa_id":3704,"ppt_model_id":3687,"slug":1263,"model_name":1264,"provider_name":1833,"name":1264,"provider":1833,"aa_name":3705,"is_open":37,"author_country":2817,"release_date":1266,"release_month":1057,"context_length":1199,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"tokens_per_second":3706,"time_to_first_token":2392,"benchmark_aime":317,"benchmark_aime_25":12,"benchmark_gpqa":3238,"benchmark_hle":3403,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":603,"benchmark_math_hard":1268,"benchmark_mmlu_pro":3707,"benchmark_scicode":625,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":484,"benchmark_mmlu_pro_reasoning":1269,"benchmark_gpqa_reasoning":1270,"benchmark_math_hard_reasoning":1271,"benchmark_aime_reasoning":1108,"benchmark_aime_25_reasoning":890,"benchmark_hle_reasoning":2719,"benchmark_scicode_reasoning":3693,"benchmark_ifbench_reasoning":1944,"benchmark_lcr_reasoning":2667,"benchmark_tau2_reasoning":1243,"benchmark_intelligence":2094,"benchmark_intelligence_reasoning":1272,"benchmark_math_reasoning":890},"21024d57-f23b-4bdb-886b-44db88312bca","Qwen3 4B (Non-reasoning)",105.474,58.599999999999994,{"aa_id":3709,"ppt_model_id":3710,"slug":1309,"model_name":1310,"provider_name":248,"name":1310,"provider":248,"aa_name":3711,"is_open":11,"author_country":2653,"release_date":1312,"release_month":1287,"context_length":856,"inference_mode":2654,"input_price_per_1m_tokens":144,"output_price_per_1m_tokens":156,"input_price":144,"output_price":156,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":1268,"benchmark_aime_25":12,"benchmark_gpqa":3712,"benchmark_hle":147,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":771,"benchmark_math_hard":1315,"benchmark_mmlu_pro":891,"benchmark_scicode":3713,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":3255,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3714,"benchmark_humaneval":3183,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":3535,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1314,"benchmark_intelligence":556},"ac7c8215-33d4-4608-b669-021d389f50ab","df753776-5b08-40e4-b68a-190e641c093d","Gemini 2.5 Pro Preview (May' 25)",82.19999999999999,41.6,87.0356,{"aa_id":3716,"ppt_model_id":3717,"slug":1318,"model_name":1319,"provider_name":2665,"name":1319,"provider":2665,"aa_name":1319,"is_open":11,"author_country":2666,"release_date":1321,"release_month":1287,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":78,"input_price":536,"output_price":78,"tokens_per_second":3718,"time_to_first_token":117,"benchmark_aime":1324,"benchmark_aime_25":1203,"benchmark_gpqa":933,"benchmark_hle":2787,"benchmark_ifbench":3237,"benchmark_lcr":3625,"benchmark_livecodebench":1201,"benchmark_math_hard":1323,"benchmark_mmlu_pro":1322,"benchmark_scicode":2733,"benchmark_tau2":1236,"benchmark_terminalbench":2934,"benchmark_accountingaudit":3478,"benchmark_agieval_zh":3719,"benchmark_agieval_en":3720,"benchmark_arc_challenge":3721,"benchmark_arc_easy":3722,"benchmark_bbeh":3723,"benchmark_bbh":3724,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3725,"benchmark_humaneval":3345,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3726,"benchmark_math":3727,"benchmark_mbppplus":3728,"benchmark_medqa":3729,"benchmark_mmlu":3730,"benchmark_mmmu":3731,"benchmark_multichallenge":12,"benchmark_simpleqa":3732,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":361,"benchmark_coding":3229},"d72690cb-273d-465c-b762-90dd1a834a7c","13d794fe-567e-4823-88ee-f9ed01ead977",66.55,74.2239,70.2671,93.43,99.0741,14.1014,81.4727,94.1622,60.7069,84.2062,54.4974,79.1045,82.5595,58.6667,19.718,{"aa_id":3734,"ppt_model_id":3735,"slug":1327,"model_name":1328,"provider_name":248,"name":1328,"provider":248,"aa_name":3736,"is_open":37,"author_country":2653,"release_date":1330,"release_month":1287,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":288,"output_price_per_1m_tokens":208,"input_price":288,"output_price":208,"tokens_per_second":3737,"time_to_first_token":3738,"benchmark_aime":3338,"benchmark_aime_25":3089,"benchmark_gpqa":2718,"benchmark_hle":2710,"benchmark_ifbench":3739,"benchmark_lcr":2667,"benchmark_livecodebench":1332,"benchmark_math_hard":2905,"benchmark_mmlu_pro":1331,"benchmark_scicode":3740,"benchmark_tau2":505,"benchmark_terminalbench":363,"benchmark_accountingaudit":3741,"benchmark_agieval_zh":12,"benchmark_agieval_en":3742,"benchmark_arc_challenge":3743,"benchmark_arc_easy":3744,"benchmark_bbeh":12,"benchmark_bbh":3745,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3746,"benchmark_humaneval":3747,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3748,"benchmark_math":691,"benchmark_mbppplus":3749,"benchmark_medqa":3750,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3751,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2722,"benchmark_coding":2752},"8bbd01e4-5e16-4ad6-8fd6-c22ac7828d03","e7ce5407-3809-4a4b-b009-dddb363915a7","Gemma 3n E4B Instruct",29.518,0.278,27.900000000000002,8.1,43.3333,53.1422,81.7406,93.3923,72.7384,88.9226,73.1707,40.5714,55.8201,54.2027,4.0222,{"aa_id":3753,"ppt_model_id":3754,"slug":1335,"model_name":3755,"provider_name":138,"name":1336,"provider":138,"aa_name":3756,"is_open":11,"author_country":2653,"release_date":1338,"release_month":1287,"context_length":142,"inference_mode":3250,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":3757,"time_to_first_token":3758,"benchmark_aime":638,"benchmark_aime_25":1237,"benchmark_gpqa":1255,"benchmark_hle":211,"benchmark_ifbench":3254,"benchmark_lcr":3759,"benchmark_livecodebench":1342,"benchmark_math_hard":1343,"benchmark_mmlu_pro":513,"benchmark_scicode":1201,"benchmark_tau2":3760,"benchmark_terminalbench":3761,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":12,"benchmark_agieval_en":3762,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":3763,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3764,"benchmark_humaneval":3573,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3765,"benchmark_mbppplus":3766,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1182,"benchmark_livecodebench_reasoning":1342,"benchmark_mmlu_pro_reasoning":513,"benchmark_gpqa_reasoning":1255,"benchmark_math_hard_reasoning":1343,"benchmark_aime_reasoning":638,"benchmark_aime_25_reasoning":1237,"benchmark_hle_reasoning":211,"benchmark_scicode_reasoning":1201,"benchmark_ifbench_reasoning":3254,"benchmark_lcr_reasoning":3759,"benchmark_terminalbench_reasoning":3761,"benchmark_tau2_reasoning":2021,"benchmark_intelligence":861,"benchmark_coding":3767,"benchmark_intelligence_reasoning":118,"benchmark_coding_reasoning":1344,"benchmark_math_reasoning":1237},"54b687fd-0a00-4aea-8758-f20a2e7befc9","a999a4ed-59c8-43b5-9e07-6bad07c18529","Claude Sonnet 4 (Reasoning)","Claude 4 Sonnet (Reasoning)",44.892,8.371,64.7,64.60000000000001,31.1,83.9356,34.6681,95.6785,90.32,62.1693,30.6,{"aa_id":3769,"ppt_model_id":3754,"slug":1335,"model_name":1336,"provider_name":138,"name":1336,"provider":138,"aa_name":3770,"is_open":11,"author_country":2653,"release_date":1338,"release_month":1287,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":3771,"time_to_first_token":3772,"benchmark_aime":3773,"benchmark_aime_25":3774,"benchmark_gpqa":2965,"benchmark_hle":69,"benchmark_ifbench":1022,"benchmark_lcr":3775,"benchmark_livecodebench":1339,"benchmark_math_hard":1340,"benchmark_mmlu_pro":891,"benchmark_scicode":3776,"benchmark_tau2":3118,"benchmark_terminalbench":3777,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":12,"benchmark_agieval_en":3762,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":3763,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3764,"benchmark_humaneval":3573,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3765,"benchmark_mbppplus":3766,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1182,"benchmark_livecodebench_reasoning":1342,"benchmark_mmlu_pro_reasoning":513,"benchmark_gpqa_reasoning":1255,"benchmark_math_hard_reasoning":1343,"benchmark_aime_reasoning":638,"benchmark_aime_25_reasoning":1237,"benchmark_hle_reasoning":211,"benchmark_scicode_reasoning":1201,"benchmark_ifbench_reasoning":3254,"benchmark_lcr_reasoning":3759,"benchmark_terminalbench_reasoning":3761,"benchmark_tau2_reasoning":2021,"benchmark_intelligence":861,"benchmark_coding":3767,"benchmark_intelligence_reasoning":118,"benchmark_coding_reasoning":1344,"benchmark_math_reasoning":1237},"d6800cdb-3c12-439f-917b-95b0d19e0d16","Claude 4 Sonnet (Non-reasoning)",45.423,0.996,40.699999999999996,38,44.3,37.3,27.3,{"aa_id":3779,"ppt_model_id":3780,"slug":1347,"model_name":3781,"provider_name":138,"name":1348,"provider":138,"aa_name":3782,"is_open":11,"author_country":2653,"release_date":1350,"release_month":1287,"context_length":142,"inference_mode":3250,"input_price_per_1m_tokens":161,"output_price_per_1m_tokens":1351,"input_price":161,"output_price":1351,"tokens_per_second":3783,"time_to_first_token":3784,"benchmark_aime":1356,"benchmark_aime_25":487,"benchmark_gpqa":3785,"benchmark_hle":2729,"benchmark_ifbench":183,"benchmark_lcr":917,"benchmark_livecodebench":1354,"benchmark_math_hard":1355,"benchmark_mmlu_pro":905,"benchmark_scicode":3238,"benchmark_tau2":869,"benchmark_terminalbench":3761,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":12,"benchmark_agieval_en":3786,"benchmark_arc_challenge":12,"benchmark_arc_easy":3787,"benchmark_bbeh":3788,"benchmark_bbh":12,"benchmark_bfcl_v3":3789,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3790,"benchmark_humaneval":3573,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3791,"benchmark_mbppplus":3792,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":412,"benchmark_livecodebench_reasoning":1354,"benchmark_mmlu_pro_reasoning":905,"benchmark_gpqa_reasoning":1353,"benchmark_math_hard_reasoning":1355,"benchmark_aime_reasoning":1356,"benchmark_aime_25_reasoning":487,"benchmark_hle_reasoning":280,"benchmark_scicode_reasoning":1267,"benchmark_ifbench_reasoning":183,"benchmark_lcr_reasoning":917,"benchmark_terminalbench_reasoning":3761,"benchmark_tau2_reasoning":869,"benchmark_intelligence":861,"benchmark_intelligence_reasoning":1071,"benchmark_coding_reasoning":1357,"benchmark_math_reasoning":487},"c4da6054-33a4-4bdc-9336-cff162183766","09439faa-298a-48bc-97b6-3f6b92e0db6a","Claude Opus 4 (Reasoning)","Claude 4 Opus (Reasoning)",36.75,7.259,79.60000000000001,82.0039,99.6956,38.3517,25.2646,96.2064,91.22,63.3598,{"aa_id":3794,"ppt_model_id":3780,"slug":1347,"model_name":1348,"provider_name":138,"name":1348,"provider":138,"aa_name":3795,"is_open":11,"author_country":2653,"release_date":1350,"release_month":1287,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":161,"output_price_per_1m_tokens":1351,"input_price":161,"output_price":1351,"tokens_per_second":3796,"time_to_first_token":3797,"benchmark_aime":894,"benchmark_aime_25":2383,"benchmark_gpqa":566,"benchmark_hle":3691,"benchmark_ifbench":624,"benchmark_lcr":2337,"benchmark_livecodebench":1352,"benchmark_math_hard":748,"benchmark_mmlu_pro":871,"benchmark_scicode":326,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":12,"benchmark_agieval_en":3786,"benchmark_arc_challenge":12,"benchmark_arc_easy":3787,"benchmark_bbeh":3788,"benchmark_bbh":12,"benchmark_bfcl_v3":3789,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3790,"benchmark_humaneval":3573,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3791,"benchmark_mbppplus":3792,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":412,"benchmark_livecodebench_reasoning":1354,"benchmark_mmlu_pro_reasoning":905,"benchmark_gpqa_reasoning":1353,"benchmark_math_hard_reasoning":1355,"benchmark_aime_reasoning":1356,"benchmark_aime_25_reasoning":487,"benchmark_hle_reasoning":280,"benchmark_scicode_reasoning":1267,"benchmark_ifbench_reasoning":183,"benchmark_lcr_reasoning":917,"benchmark_terminalbench_reasoning":3761,"benchmark_tau2_reasoning":869,"benchmark_intelligence":861,"benchmark_intelligence_reasoning":1071,"benchmark_coding_reasoning":1357,"benchmark_math_reasoning":487},"2e57ec02-387f-401a-bdc1-d1c6f36c020c","Claude 4 Opus (Non-reasoning)",34.335,1.439,{"aa_id":3799,"ppt_model_id":3800,"slug":1360,"model_name":1361,"provider_name":3115,"name":1361,"provider":3115,"aa_name":3801,"is_open":11,"author_country":2817,"release_date":1363,"release_month":1287,"context_length":670,"inference_mode":2654,"input_price_per_1m_tokens":1364,"output_price_per_1m_tokens":1365,"input_price":1364,"output_price":1365,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":973,"benchmark_aime_25":1322,"benchmark_gpqa":1166,"benchmark_hle":3802,"benchmark_ifbench":3803,"benchmark_lcr":3254,"benchmark_livecodebench":771,"benchmark_math_hard":1367,"benchmark_mmlu_pro":3804,"benchmark_scicode":3253,"benchmark_tau2":1644,"benchmark_terminalbench":2907,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":12,"benchmark_agieval_en":3805,"benchmark_arc_challenge":3806,"benchmark_arc_easy":3807,"benchmark_bbeh":12,"benchmark_bbh":3808,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":1168,"benchmark_gaia":3809,"benchmark_gsm8k":3810,"benchmark_humaneval":3533,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3811,"benchmark_math":1322,"benchmark_mbppplus":3812,"benchmark_medqa":12,"benchmark_mmlu":3813,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3814,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":569,"benchmark_intelligence":2935,"benchmark_coding":3506},"61ca0533-544d-47f7-bf98-a6cbe0ba2177","a373bb91-7d66-43d8-bc7f-c8c7f6b598b8","DeepSeek R1 0528 (May '25)",14.899999999999999,39.6,84.89999999999999,89.0157,95.1324,98.6532,87.9435,27.8788,95.2995,97.8571,59.5238,90.5349,25.0816,{"aa_id":3816,"ppt_model_id":3817,"slug":1370,"model_name":1371,"provider_name":248,"name":1371,"provider":248,"aa_name":3818,"is_open":11,"author_country":2653,"release_date":1373,"release_month":1374,"context_length":856,"inference_mode":2654,"input_price_per_1m_tokens":144,"output_price_per_1m_tokens":156,"input_price":144,"output_price":156,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":1379,"benchmark_aime_25":12,"benchmark_gpqa":1375,"benchmark_hle":3819,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":1377,"benchmark_math_hard":1378,"benchmark_mmlu_pro":416,"benchmark_scicode":2461,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1376,"benchmark_intelligence":1203,"benchmark_coding":1454},"fc7ea66a-d820-4935-9a4e-00c53d5ca36a","334e9056-3431-4882-a09d-41211e49f61b","Gemini 2.5 Pro Preview (Mar' 25)",17.1,{"aa_id":3821,"ppt_model_id":3822,"slug":1382,"model_name":1383,"provider_name":3823,"name":1383,"provider":3823,"aa_name":1383,"is_open":11,"author_country":2653,"release_date":1385,"release_month":1374,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":3824,"time_to_first_token":3825,"benchmark_aime":861,"benchmark_aime_25":3640,"benchmark_gpqa":1528,"benchmark_hle":2719,"benchmark_ifbench":3826,"benchmark_lcr":3254,"benchmark_livecodebench":2422,"benchmark_math_hard":1379,"benchmark_mmlu_pro":2293,"benchmark_scicode":3827,"benchmark_tau2":1331,"benchmark_terminalbench":3121,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":12,"benchmark_agieval_en":3828,"benchmark_arc_challenge":3829,"benchmark_arc_easy":3722,"benchmark_bbeh":3830,"benchmark_bbh":3831,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3832,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":3833,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3834,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1899},"54548730-10f4-4002-8519-978dc55a3b13","1f2d1466-306e-4d55-8086-c3f485624e8b","xAI",68.962,0.354,46.9,36.8,71.1705,93.8567,18.031,53.3501,90.8537,58.7302,37.4249,{"aa_id":3836,"ppt_model_id":3822,"slug":1382,"model_name":1383,"provider_name":3823,"name":1383,"provider":3823,"aa_name":3837,"is_open":11,"author_country":2653,"release_date":1385,"release_month":1374,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":12,"benchmark_agieval_en":3828,"benchmark_arc_challenge":3829,"benchmark_arc_easy":3722,"benchmark_bbeh":3830,"benchmark_bbh":3831,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3832,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":3833,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3834,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1899},"6627d464-2e65-4665-a340-bb0193d2a25c","Grok 3 Reasoning Beta",{"aa_id":3839,"ppt_model_id":3840,"slug":1388,"model_name":1389,"provider_name":3823,"name":1389,"provider":3823,"aa_name":3841,"is_open":11,"author_country":2653,"release_date":1391,"release_month":1374,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":25,"input_price":143,"output_price":25,"tokens_per_second":3842,"time_to_first_token":3843,"benchmark_aime":3697,"benchmark_aime_25":1844,"benchmark_gpqa":3175,"benchmark_hle":1636,"benchmark_ifbench":3844,"benchmark_lcr":3845,"benchmark_livecodebench":1269,"benchmark_math_hard":1168,"benchmark_mmlu_pro":1187,"benchmark_scicode":1239,"benchmark_tau2":1240,"benchmark_terminalbench":1191,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":3846,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1844,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3847,"benchmark_coding":757},"672a5322-b764-4492-8700-a8599063c496","a000c5fb-9106-4bec-bb8f-1445078bfc2e","Grok 3 mini Reasoning (high)",198.024,0.344,45.9,50.3,85.1532,32.1,{"aa_id":3849,"ppt_model_id":3850,"slug":1394,"model_name":1395,"provider_name":9,"name":1395,"provider":9,"aa_name":3851,"is_open":11,"author_country":2653,"release_date":1397,"release_month":1374,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":436,"output_price_per_1m_tokens":1398,"input_price":436,"output_price":1398,"tokens_per_second":3852,"time_to_first_token":3853,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":1399,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1366,"benchmark_intelligence":1341},"11e1a619-e27c-4253-80ae-6e6bf1476a25","0a338e02-ece0-4abe-8680-469cfcbb02f9","o3-pro",23.393,82.833,{"aa_id":3855,"ppt_model_id":3856,"slug":1402,"model_name":1403,"provider_name":248,"name":1403,"provider":248,"aa_name":1403,"is_open":11,"author_country":2653,"release_date":1405,"release_month":1374,"context_length":856,"inference_mode":2654,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":156,"input_price":61,"output_price":156,"tokens_per_second":3857,"time_to_first_token":3858,"benchmark_aime":1042,"benchmark_aime_25":1500,"benchmark_gpqa":3119,"benchmark_hle":2684,"benchmark_ifbench":3147,"benchmark_lcr":1145,"benchmark_livecodebench":3859,"benchmark_math_hard":1408,"benchmark_mmlu_pro":1406,"benchmark_scicode":959,"benchmark_tau2":602,"benchmark_terminalbench":3411,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":3860,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3861,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":2765,"benchmark_gsm8k":3764,"benchmark_humaneval":12,"benchmark_ifeval":3862,"benchmark_knights_and_knaves":12,"benchmark_math":710,"benchmark_mbppplus":3535,"benchmark_medqa":3863,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3864,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":1201,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2263,"benchmark_coding":3865},"05f7d45c-34e4-4600-a7db-61398e3f90a3","8d530051-07bc-4238-97a0-2e2ebe72724a",116.251,21.834,80.10000000000001,91.0841,88.7268,90.7579,94.5797,52.982,31.9,{"aa_id":3867,"ppt_model_id":3868,"slug":1411,"model_name":3869,"provider_name":248,"name":1412,"provider":248,"aa_name":3869,"is_open":11,"author_country":2653,"release_date":1414,"release_month":1374,"context_length":856,"inference_mode":3250,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":220,"input_price":50,"output_price":220,"tokens_per_second":3870,"time_to_first_token":3871,"benchmark_aime":1419,"benchmark_aime_25":487,"benchmark_gpqa":944,"benchmark_hle":1636,"benchmark_ifbench":3845,"benchmark_lcr":712,"benchmark_livecodebench":1417,"benchmark_math_hard":1418,"benchmark_mmlu_pro":1154,"benchmark_scicode":148,"benchmark_tau2":2964,"benchmark_terminalbench":3527,"benchmark_accountingaudit":3190,"benchmark_agieval_zh":12,"benchmark_agieval_en":3872,"benchmark_arc_challenge":12,"benchmark_arc_easy":3873,"benchmark_bbeh":12,"benchmark_bbh":3874,"benchmark_bfcl_v3":12,"benchmark_bird_critic":3259,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3875,"benchmark_humaneval":12,"benchmark_ifeval":3876,"benchmark_knights_and_knaves":12,"benchmark_math":2262,"benchmark_mbppplus":3877,"benchmark_medqa":12,"benchmark_mmlu":3878,"benchmark_mmmu":2483,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":3272,"benchmark_swe_bench_lite":3879,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1041,"benchmark_livecodebench_reasoning":1417,"benchmark_mmlu_pro_reasoning":1154,"benchmark_gpqa_reasoning":944,"benchmark_math_hard_reasoning":1418,"benchmark_aime_reasoning":1419,"benchmark_aime_25_reasoning":487,"benchmark_hle_reasoning":1636,"benchmark_scicode_reasoning":148,"benchmark_ifbench_reasoning":3845,"benchmark_lcr_reasoning":712,"benchmark_terminalbench_reasoning":3229,"benchmark_tau2_reasoning":2964,"benchmark_intelligence":3880,"benchmark_coding":132,"benchmark_intelligence_reasoning":747,"benchmark_coding_reasoning":1420,"benchmark_math_reasoning":487},"ee29b2f6-6eae-4c74-9a5b-4f7b612e9758","4459d77d-e75d-4765-9abf-98ea3c2c4ed3","Gemini 2.5 Flash (Reasoning)",213.382,14.027,74.1948,98.9057,61.5519,79.0751,84.2884,57.672,85.7499,26.087,20.6,{"aa_id":3882,"ppt_model_id":3868,"slug":1411,"model_name":1412,"provider_name":248,"name":1412,"provider":248,"aa_name":3883,"is_open":11,"author_country":2653,"release_date":1414,"release_month":1374,"context_length":856,"inference_mode":2654,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":220,"input_price":50,"output_price":220,"tokens_per_second":3884,"time_to_first_token":3885,"benchmark_aime":497,"benchmark_aime_25":2262,"benchmark_gpqa":2965,"benchmark_hle":2719,"benchmark_ifbench":1071,"benchmark_lcr":3844,"benchmark_livecodebench":1415,"benchmark_math_hard":1416,"benchmark_mmlu_pro":1066,"benchmark_scicode":2692,"benchmark_tau2":3802,"benchmark_terminalbench":3245,"benchmark_accountingaudit":3190,"benchmark_agieval_zh":12,"benchmark_agieval_en":3872,"benchmark_arc_challenge":12,"benchmark_arc_easy":3873,"benchmark_bbeh":12,"benchmark_bbh":3874,"benchmark_bfcl_v3":12,"benchmark_bird_critic":3259,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3875,"benchmark_humaneval":12,"benchmark_ifeval":3876,"benchmark_knights_and_knaves":12,"benchmark_math":2262,"benchmark_mbppplus":3877,"benchmark_medqa":12,"benchmark_mmlu":3878,"benchmark_mmmu":2483,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":3272,"benchmark_swe_bench_lite":3879,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1041,"benchmark_livecodebench_reasoning":1417,"benchmark_mmlu_pro_reasoning":1154,"benchmark_gpqa_reasoning":944,"benchmark_math_hard_reasoning":1418,"benchmark_aime_reasoning":1419,"benchmark_aime_25_reasoning":487,"benchmark_hle_reasoning":1636,"benchmark_scicode_reasoning":148,"benchmark_ifbench_reasoning":3845,"benchmark_lcr_reasoning":712,"benchmark_terminalbench_reasoning":3229,"benchmark_tau2_reasoning":2964,"benchmark_intelligence":3880,"benchmark_coding":132,"benchmark_intelligence_reasoning":747,"benchmark_coding_reasoning":1420,"benchmark_math_reasoning":487},"3fa87a47-fcca-4724-93ec-915acd940f3a","Gemini 2.5 Flash (Non-reasoning)",214.705,0.419,{"aa_id":3887,"ppt_model_id":3888,"slug":1423,"model_name":1424,"provider_name":3889,"name":1424,"provider":3889,"aa_name":3890,"is_open":37,"author_country":2817,"release_date":1426,"release_month":1374,"context_length":792,"inference_mode":2654,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":1427,"input_price":536,"output_price":1427,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":1166,"benchmark_aime_25":3338,"benchmark_gpqa":1428,"benchmark_hle":99,"benchmark_ifbench":3891,"benchmark_lcr":3701,"benchmark_livecodebench":1108,"benchmark_math_hard":1429,"benchmark_mmlu_pro":3562,"benchmark_scicode":3892,"benchmark_tau2":2964,"benchmark_terminalbench":363,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":12,"benchmark_agieval_en":3893,"benchmark_arc_challenge":3894,"benchmark_arc_easy":3895,"benchmark_bbeh":12,"benchmark_bbh":3896,"benchmark_bfcl_v3":3897,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3070,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":961,"benchmark_mbppplus":3105,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2667,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3898,"benchmark_coding":3899},"736203a8-500f-4eb6-8055-ebc2d96c3e6e","339acafb-9735-41ab-a6a8-1625e08c9312","MiniMax","MiniMax M1 40k",41.199999999999996,37.8,81.5397,95.3072,98.9339,74.2674,47.8496,20.9,14.1,{"aa_id":3901,"ppt_model_id":3902,"slug":1432,"model_name":1433,"provider_name":2665,"name":1433,"provider":2665,"aa_name":3903,"is_open":37,"author_country":2666,"release_date":1435,"release_month":1374,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":901,"output_price_per_1m_tokens":377,"input_price":901,"output_price":377,"tokens_per_second":3904,"time_to_first_token":3905,"benchmark_aime":3906,"benchmark_aime_25":747,"benchmark_gpqa":567,"benchmark_hle":2787,"benchmark_ifbench":3648,"benchmark_lcr":2775,"benchmark_livecodebench":3326,"benchmark_math_hard":962,"benchmark_mmlu_pro":3907,"benchmark_scicode":3167,"benchmark_tau2":556,"benchmark_terminalbench":2753,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":3908,"benchmark_arc_challenge":3909,"benchmark_arc_easy":3910,"benchmark_bbeh":3911,"benchmark_bbh":3912,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3913,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3914,"benchmark_math":747,"benchmark_mbppplus":3915,"benchmark_medqa":3916,"benchmark_mmlu":3917,"benchmark_mmmu":3918,"benchmark_multichallenge":12,"benchmark_simpleqa":3919,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":3920,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1713,"benchmark_coding":3679},"2a00a0fd-4068-4f68-bc17-aea5dc09deba","6e68e635-72c6-412a-9954-34e6f36e7610","Mistral Small 3.2",123.718,0.361,32.300000000000004,68.10000000000001,62.3331,91.8089,97.7694,14.1814,76.4706,83.5366,55.5896,56.6138,70.4635,75.9957,55.8889,9.6625,5.6667,{"aa_id":3922,"ppt_model_id":3923,"slug":1446,"model_name":1447,"provider_name":1448,"name":1447,"provider":1448,"aa_name":1447,"is_open":37,"author_country":2817,"release_date":1450,"release_month":1374,"context_length":1451,"inference_mode":2654,"input_price_per_1m_tokens":1250,"output_price_per_1m_tokens":312,"input_price":1250,"output_price":312,"tokens_per_second":3924,"time_to_first_token":3925,"benchmark_aime":1086,"benchmark_aime_25":3926,"benchmark_gpqa":3927,"benchmark_hle":2912,"benchmark_ifbench":3928,"benchmark_lcr":363,"benchmark_livecodebench":1454,"benchmark_math_hard":3929,"benchmark_mmlu_pro":3930,"benchmark_scicode":3624,"benchmark_tau2":2667,"benchmark_terminalbench":2975,"benchmark_accountingaudit":12,"benchmark_agieval_zh":3931,"benchmark_agieval_en":3932,"benchmark_arc_challenge":3933,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3934,"benchmark_bfcl_v3":12,"benchmark_bird_critic":3935,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3936,"benchmark_humaneval":3937,"benchmark_ifeval":3938,"benchmark_knights_and_knaves":12,"benchmark_math":3926,"benchmark_mbppplus":3939,"benchmark_medqa":12,"benchmark_mmlu":3940,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3941,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":161,"benchmark_coding":2768},"4fadf2fa-4544-44f6-b55b-c81ae3ad9c5e","74fcee95-fc3b-429b-9447-3ded1e17b162",28.07,1.77,41.3,81.10000000000001,39.1,93.10000000000001,77.60000000000001,88.9762,74.1163,93.9759,85.6858,21.7241,94.6401,86.6242,85.3974,49.7312,84.5021,36.9006,{"aa_id":3943,"ppt_model_id":3944,"slug":1495,"model_name":1496,"provider_name":3823,"name":1496,"provider":3823,"aa_name":1496,"is_open":11,"author_country":2653,"release_date":1498,"release_month":1469,"context_length":981,"inference_mode":2654,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":3945,"time_to_first_token":3946,"benchmark_aime":1502,"benchmark_aime_25":3947,"benchmark_gpqa":1500,"benchmark_hle":3641,"benchmark_ifbench":183,"benchmark_lcr":3117,"benchmark_livecodebench":3365,"benchmark_math_hard":1501,"benchmark_mmlu_pro":1499,"benchmark_scicode":1134,"benchmark_tau2":3948,"benchmark_terminalbench":198,"benchmark_accountingaudit":3190,"benchmark_agieval_zh":12,"benchmark_agieval_en":3949,"benchmark_arc_challenge":12,"benchmark_arc_easy":3950,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":3951,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3952,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3947,"benchmark_mbppplus":3953,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":3954,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1353,"benchmark_intelligence":3665,"benchmark_coding":209},"b6946da0-d1ec-4873-ad09-c3eacc3a7b41","a75404d3-fa0b-4234-9d98-7e7a34b22837",51.635,8.297,92.7,74.9,89.3166,99.0375,51.145,96.9512,63.1579,7.6667,{"aa_id":3956,"ppt_model_id":3957,"slug":1505,"model_name":1506,"provider_name":2665,"name":1506,"provider":2665,"aa_name":3958,"is_open":37,"author_country":2666,"release_date":1508,"release_month":1469,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":1509,"output_price_per_1m_tokens":1250,"input_price":1509,"output_price":1250,"tokens_per_second":3959,"time_to_first_token":323,"benchmark_aime":50,"benchmark_aime_25":2973,"benchmark_gpqa":1510,"benchmark_hle":3403,"benchmark_ifbench":3960,"benchmark_lcr":2098,"benchmark_livecodebench":1511,"benchmark_math_hard":553,"benchmark_mmlu_pro":1189,"benchmark_scicode":1236,"benchmark_tau2":3961,"benchmark_terminalbench":2975,"benchmark_accountingaudit":3962,"benchmark_agieval_zh":3963,"benchmark_agieval_en":3964,"benchmark_arc_challenge":3965,"benchmark_arc_easy":3966,"benchmark_bbeh":3967,"benchmark_bbh":3968,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":3969,"benchmark_gaia":12,"benchmark_gsm8k":3970,"benchmark_humaneval":3971,"benchmark_ifeval":12,"benchmark_knights_and_knaves":3506,"benchmark_math":589,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":3972,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3973,"benchmark_stock_bcs":3974,"benchmark_swe_bench_lite":12,"benchmark_wmdp":3975,"benchmark_wmt":3976,"benchmark_intelligence":1986,"benchmark_coding":3245},"3ece35f8-6a55-49e1-b011-5f44ad5d8d69","f21bd418-5d13-4b63-8f33-913ebd0bc78c","Devstral Small (Jul '25)",203.643,34.599999999999994,28.4,63.3333,59.7561,59.9764,90.4437,97.138,11.8584,64.8441,45.1,89.2343,77.439,73.4796,6.7268,41.6667,61.0414,34.1195,{"aa_id":3978,"ppt_model_id":3979,"slug":1514,"model_name":1515,"provider_name":2665,"name":1515,"provider":2665,"aa_name":1515,"is_open":37,"author_country":2666,"release_date":1517,"release_month":1469,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":78,"input_price":536,"output_price":78,"tokens_per_second":3980,"time_to_first_token":3981,"benchmark_aime":429,"benchmark_aime_25":3012,"benchmark_gpqa":199,"benchmark_hle":2934,"benchmark_ifbench":121,"benchmark_lcr":983,"benchmark_livecodebench":917,"benchmark_math_hard":1024,"benchmark_mmlu_pro":710,"benchmark_scicode":3013,"benchmark_tau2":3982,"benchmark_terminalbench":3983,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3984,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3012,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1987,"benchmark_coding":2907},"cace95bc-70a7-4509-91b6-814744584047","26fd4e71-75b8-4b06-bd8c-bd0016dd7420",126.299,0.443,19.900000000000002,9.1,48.1339,{"aa_id":3986,"ppt_model_id":3987,"slug":1520,"model_name":1521,"provider_name":3988,"name":1521,"provider":3988,"aa_name":2102,"is_open":37,"author_country":2817,"release_date":1524,"release_month":1469,"context_length":311,"inference_mode":2654,"input_price_per_1m_tokens":708,"output_price_per_1m_tokens":1153,"input_price":708,"output_price":1153,"tokens_per_second":3989,"time_to_first_token":3990,"benchmark_aime":1528,"benchmark_aime_25":3252,"benchmark_gpqa":1677,"benchmark_hle":890,"benchmark_ifbench":3907,"benchmark_lcr":3991,"benchmark_livecodebench":994,"benchmark_math_hard":1527,"benchmark_mmlu_pro":1112,"benchmark_scicode":879,"benchmark_tau2":860,"benchmark_terminalbench":3761,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":3992,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3993,"benchmark_bfcl_v3":3789,"benchmark_bird_critic":12,"benchmark_darkbench":3994,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3995,"benchmark_humaneval":12,"benchmark_ifeval":3996,"benchmark_knights_and_knaves":12,"benchmark_math":1794,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":3997,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3998,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":1645,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1526,"benchmark_intelligence":1610,"benchmark_coding":447},"8e0fd5e4-4856-42fb-ba7b-00b3ea9292fc","ebe5a680-6505-450b-870e-5891c0a15eb2","Kimi",98.887,0.808,66.3,82.9929,87.0834,48.6364,94.9962,87.6155,88.2539,26.5202,{"aa_id":4000,"ppt_model_id":3987,"slug":1520,"model_name":1521,"provider_name":3988,"name":1521,"provider":3988,"aa_name":4001,"is_open":37,"author_country":2817,"release_date":1524,"release_month":1469,"context_length":311,"inference_mode":2654,"input_price_per_1m_tokens":708,"output_price_per_1m_tokens":1153,"input_price":708,"output_price":1153,"tokens_per_second":4002,"time_to_first_token":4003,"benchmark_aime":1528,"benchmark_aime_25":4004,"benchmark_gpqa":1003,"benchmark_hle":2897,"benchmark_ifbench":3665,"benchmark_lcr":974,"benchmark_livecodebench":3554,"benchmark_math_hard":1527,"benchmark_mmlu_pro":4005,"benchmark_scicode":2071,"benchmark_tau2":878,"benchmark_terminalbench":2907,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":3992,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":3993,"benchmark_bfcl_v3":3789,"benchmark_bird_critic":12,"benchmark_darkbench":3994,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3995,"benchmark_humaneval":12,"benchmark_ifeval":3996,"benchmark_knights_and_knaves":12,"benchmark_math":1794,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":3997,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":3998,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":1645,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1526,"benchmark_intelligence":1610,"benchmark_coding":447},"f70ed347-1111-4638-af99-e0655733a6e4","Kimi K2",34.987,1.02,56.99999999999999,82.39999999999999,{"aa_id":4007,"ppt_model_id":4008,"slug":1539,"model_name":1540,"provider_name":1833,"name":1540,"provider":1833,"aa_name":4009,"is_open":37,"author_country":2817,"release_date":1542,"release_month":1469,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":1543,"output_price_per_1m_tokens":495,"input_price":1543,"output_price":495,"tokens_per_second":4010,"time_to_first_token":4011,"benchmark_aime":769,"benchmark_aime_25":769,"benchmark_gpqa":1259,"benchmark_hle":2812,"benchmark_ifbench":4012,"benchmark_lcr":2972,"benchmark_livecodebench":4013,"benchmark_math_hard":1378,"benchmark_mmlu_pro":1187,"benchmark_scicode":2337,"benchmark_tau2":3213,"benchmark_terminalbench":1986,"benchmark_accountingaudit":12,"benchmark_agieval_zh":4014,"benchmark_agieval_en":3462,"benchmark_arc_challenge":4015,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4016,"benchmark_bfcl_v3":12,"benchmark_bird_critic":4017,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":4018,"benchmark_humaneval":3285,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":769,"benchmark_mbppplus":4019,"benchmark_medqa":4020,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":4021,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4022,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":174,"benchmark_coding":447},"41c14978-61f4-4f01-8548-39826454e80c","def3066a-ef70-4379-8fe2-458aceb625fd","Qwen3 235B A22B 2507 Instruct",65.134,1.07,46.1,52.400000000000006,84.3681,94.7952,87.3733,30.9417,88.7036,62.6984,84.7604,50.601,36.3333,{"aa_id":4024,"ppt_model_id":4025,"slug":1546,"model_name":4026,"provider_name":248,"name":1547,"provider":248,"aa_name":4027,"is_open":11,"author_country":2653,"release_date":1549,"release_month":1469,"context_length":856,"inference_mode":3250,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":536,"input_price":495,"output_price":536,"tokens_per_second":4028,"time_to_first_token":4029,"benchmark_aime":316,"benchmark_aime_25":4030,"benchmark_gpqa":1552,"benchmark_hle":2722,"benchmark_ifbench":212,"benchmark_lcr":4031,"benchmark_livecodebench":1553,"benchmark_math_hard":4032,"benchmark_mmlu_pro":1551,"benchmark_scicode":3460,"benchmark_tau2":3475,"benchmark_terminalbench":545,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4033,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":4034,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1553,"benchmark_mmlu_pro_reasoning":1551,"benchmark_gpqa_reasoning":1552,"benchmark_math_hard_reasoning":1554,"benchmark_aime_reasoning":316,"benchmark_aime_25_reasoning":1079,"benchmark_hle_reasoning":2722,"benchmark_scicode_reasoning":3460,"benchmark_ifbench_reasoning":212,"benchmark_lcr_reasoning":4035,"benchmark_terminalbench_reasoning":545,"benchmark_tau2_reasoning":3475,"benchmark_intelligence":3046,"benchmark_coding":291,"benchmark_intelligence_reasoning":1556,"benchmark_coding_reasoning":1555,"benchmark_math_reasoning":1079},"f712de24-cddf-4249-9513-2e28af53381a","ed39bf6d-570e-45b6-b6f4-3d701cff678f","Gemini 2.5 Flash Lite (Reasoning)","Gemini 2.5 Flash-Lite (Reasoning)",312.341,20.173,53.300000000000004,51.300000000000004,96.89999999999999,58.0126,35.3,51.3,{"aa_id":4037,"ppt_model_id":4025,"slug":1546,"model_name":1547,"provider_name":248,"name":1547,"provider":248,"aa_name":4038,"is_open":11,"author_country":2653,"release_date":1549,"release_month":1469,"context_length":856,"inference_mode":2654,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":536,"input_price":495,"output_price":536,"tokens_per_second":4039,"time_to_first_token":4040,"benchmark_aime":497,"benchmark_aime_25":4034,"benchmark_gpqa":146,"benchmark_hle":3403,"benchmark_ifbench":3624,"benchmark_lcr":3239,"benchmark_livecodebench":1201,"benchmark_math_hard":4041,"benchmark_mmlu_pro":3293,"benchmark_scicode":3037,"benchmark_tau2":1243,"benchmark_terminalbench":363,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4033,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":4034,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1553,"benchmark_mmlu_pro_reasoning":1551,"benchmark_gpqa_reasoning":1552,"benchmark_math_hard_reasoning":1554,"benchmark_aime_reasoning":316,"benchmark_aime_25_reasoning":1079,"benchmark_hle_reasoning":2722,"benchmark_scicode_reasoning":3460,"benchmark_ifbench_reasoning":212,"benchmark_lcr_reasoning":4035,"benchmark_terminalbench_reasoning":545,"benchmark_tau2_reasoning":3475,"benchmark_intelligence":3046,"benchmark_coding":291,"benchmark_intelligence_reasoning":1556,"benchmark_coding_reasoning":1555,"benchmark_math_reasoning":1079},"98a51145-4729-42bc-ab22-2c9379886ea1","Gemini 2.5 Flash-Lite (Non-reasoning)",283.227,0.291,92.60000000000001,{"aa_id":4043,"ppt_model_id":4044,"slug":1566,"model_name":1567,"provider_name":1833,"name":1567,"provider":1833,"aa_name":4045,"is_open":37,"author_country":2817,"release_date":1569,"release_month":1469,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":1570,"output_price_per_1m_tokens":312,"input_price":1570,"output_price":312,"tokens_per_second":4046,"time_to_first_token":4047,"benchmark_aime":4048,"benchmark_aime_25":3237,"benchmark_gpqa":1572,"benchmark_hle":2710,"benchmark_ifbench":209,"benchmark_lcr":3515,"benchmark_livecodebench":1573,"benchmark_math_hard":3424,"benchmark_mmlu_pro":1571,"benchmark_scicode":784,"benchmark_tau2":4049,"benchmark_terminalbench":2711,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":4050,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":4051,"benchmark_ifeval":4052,"benchmark_knights_and_knaves":12,"benchmark_math":4053,"benchmark_mbppplus":3186,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4054,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1050,"benchmark_coding":2720},"86abd698-c384-4faa-9930-c956e40ed1f4","b04ba9cb-b536-4335-97dc-d992337a7aa9","Qwen3 Coder 480B A35B Instruct",65.699,1.588,47.699999999999996,43.6,30.9859,92.6829,82.8096,39.3,44.6667,{"aa_id":4056,"ppt_model_id":4057,"slug":1585,"model_name":4058,"provider_name":1833,"name":1586,"provider":1833,"aa_name":4059,"is_open":37,"author_country":2817,"release_date":1588,"release_month":1469,"context_length":1477,"inference_mode":3250,"input_price_per_1m_tokens":1589,"output_price_per_1m_tokens":312,"input_price":1589,"output_price":312,"tokens_per_second":4060,"time_to_first_token":4061,"benchmark_aime":1158,"benchmark_aime_25":918,"benchmark_gpqa":944,"benchmark_hle":161,"benchmark_ifbench":1109,"benchmark_lcr":725,"benchmark_livecodebench":1571,"benchmark_math_hard":1590,"benchmark_mmlu_pro":1268,"benchmark_scicode":879,"benchmark_tau2":4062,"benchmark_terminalbench":3527,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1571,"benchmark_mmlu_pro_reasoning":1268,"benchmark_gpqa_reasoning":944,"benchmark_math_hard_reasoning":1590,"benchmark_aime_reasoning":1158,"benchmark_aime_25_reasoning":918,"benchmark_hle_reasoning":161,"benchmark_scicode_reasoning":879,"benchmark_ifbench_reasoning":1109,"benchmark_lcr_reasoning":725,"benchmark_terminalbench_reasoning":3229,"benchmark_tau2_reasoning":4062,"benchmark_intelligence_reasoning":556,"benchmark_coding_reasoning":328,"benchmark_math_reasoning":918},"25ae5e9d-4edb-4e41-9fab-07033501c750","7b9c3ea7-4768-45c8-8161-93454a2c1ee6","Qwen3 235B A22B Thinking 2507 (Reasoning)","Qwen3 235B A22B 2507 (Reasoning)",40.16,1.402,53.2,{"aa_id":4064,"ppt_model_id":4065,"slug":1593,"model_name":1594,"provider_name":4066,"name":1594,"provider":4066,"aa_name":4067,"is_open":37,"author_country":2653,"release_date":1596,"release_month":1469,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":808,"output_price_per_1m_tokens":370,"input_price":808,"output_price":370,"tokens_per_second":4068,"time_to_first_token":4069,"benchmark_aime":4070,"benchmark_aime_25":1208,"benchmark_gpqa":487,"benchmark_hle":2753,"benchmark_ifbench":302,"benchmark_lcr":1136,"benchmark_livecodebench":1598,"benchmark_math_hard":1599,"benchmark_mmlu_pro":1597,"benchmark_scicode":4071,"benchmark_tau2":484,"benchmark_terminalbench":3061,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4072,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4073,"benchmark_bfcl_v3":4074,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1208,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":328,"benchmark_coding":4075},"7e94429a-1ca7-48b2-ab04-0773e680fa21","866f66d3-77a2-484d-b8e7-49208111081e","Z AI","GLM-4.5-Air",94.591,0.609,67.30000000000001,30.599999999999998,66.3654,77.945,69.1061,23.8,{"aa_id":4077,"ppt_model_id":4078,"slug":1603,"model_name":4079,"provider_name":4066,"name":1604,"provider":4066,"aa_name":4080,"is_open":37,"author_country":2653,"release_date":1606,"release_month":1469,"context_length":287,"inference_mode":3250,"input_price_per_1m_tokens":274,"output_price_per_1m_tokens":1153,"input_price":274,"output_price":1153,"tokens_per_second":4081,"time_to_first_token":4082,"benchmark_aime":905,"benchmark_aime_25":160,"benchmark_gpqa":1607,"benchmark_hle":4083,"benchmark_ifbench":30,"benchmark_lcr":201,"benchmark_livecodebench":1608,"benchmark_math_hard":4084,"benchmark_mmlu_pro":785,"benchmark_scicode":3429,"benchmark_tau2":1124,"benchmark_terminalbench":995,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4085,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4086,"benchmark_bfcl_v3":4087,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":3954,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1608,"benchmark_mmlu_pro_reasoning":785,"benchmark_gpqa_reasoning":1607,"benchmark_math_hard_reasoning":1609,"benchmark_aime_reasoning":905,"benchmark_aime_25_reasoning":160,"benchmark_hle_reasoning":4083,"benchmark_scicode_reasoning":3429,"benchmark_ifbench_reasoning":30,"benchmark_lcr_reasoning":201,"benchmark_terminalbench_reasoning":995,"benchmark_tau2_reasoning":1124,"benchmark_intelligence_reasoning":1611,"benchmark_coding_reasoning":1610,"benchmark_math_reasoning":160},"09ea21b1-9a64-4d2d-b6f5-81082a1c3268","a0c8b9c9-1fb6-4b89-9c1c-ef5c1bad8887","GLM 4.5 (Reasoning)","GLM-4.5 (Reasoning)",48.187,0.835,12.2,97.89999999999999,80.9223,83.7788,76.7395,{"aa_id":4089,"ppt_model_id":4090,"slug":1614,"model_name":1615,"provider_name":1833,"name":1615,"provider":1833,"aa_name":4091,"is_open":37,"author_country":2817,"release_date":1617,"release_month":1469,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":404,"output_price_per_1m_tokens":50,"input_price":404,"output_price":50,"tokens_per_second":4092,"time_to_first_token":4093,"benchmark_aime":1200,"benchmark_aime_25":3991,"benchmark_gpqa":1021,"benchmark_hle":2753,"benchmark_ifbench":2733,"benchmark_lcr":4094,"benchmark_livecodebench":130,"benchmark_math_hard":1618,"benchmark_mmlu_pro":1255,"benchmark_scicode":2860,"benchmark_tau2":4095,"benchmark_terminalbench":2975,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3991,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":161,"benchmark_coding":1272},"3c62ea6d-55d7-4346-952c-a708ca692fac","5ce1fc67-0ea7-45db-941a-41e5dd6b9834","Qwen3 30B A3B 2507 Instruct",57.046,1.147,22.7,10.2,{"aa_id":4097,"ppt_model_id":4098,"slug":1621,"model_name":1622,"provider_name":1833,"name":1622,"provider":1833,"aa_name":1622,"is_open":37,"author_country":2817,"release_date":1624,"release_month":1469,"context_length":1625,"inference_mode":2654,"input_price_per_1m_tokens":1509,"output_price_per_1m_tokens":1626,"input_price":1509,"output_price":1626,"tokens_per_second":4099,"time_to_first_token":4100,"benchmark_aime":28,"benchmark_aime_25":3299,"benchmark_gpqa":449,"benchmark_hle":69,"benchmark_ifbench":1186,"benchmark_lcr":3299,"benchmark_livecodebench":3253,"benchmark_math_hard":973,"benchmark_mmlu_pro":1627,"benchmark_scicode":3649,"benchmark_tau2":2071,"benchmark_terminalbench":1986,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3725,"benchmark_humaneval":12,"benchmark_ifeval":4101,"benchmark_knights_and_knaves":12,"benchmark_math":936,"benchmark_mbppplus":3224,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":436,"benchmark_coding":4102},"7c675f29-c49a-4c4b-aa17-2a53c92f2c88","ea0ca2c2-4baf-45b2-a74c-163b70312aa1",27.237,1.424,78.7431,19.4,{"aa_id":4104,"ppt_model_id":4105,"slug":1639,"model_name":4106,"provider_name":138,"name":1640,"provider":138,"aa_name":4107,"is_open":11,"author_country":2653,"release_date":1642,"release_month":1635,"context_length":142,"inference_mode":3250,"input_price_per_1m_tokens":161,"output_price_per_1m_tokens":1351,"input_price":161,"output_price":1351,"tokens_per_second":4108,"time_to_first_token":4109,"benchmark_aime":12,"benchmark_aime_25":3281,"benchmark_gpqa":1066,"benchmark_hle":2721,"benchmark_ifbench":4110,"benchmark_lcr":3991,"benchmark_livecodebench":414,"benchmark_math_hard":12,"benchmark_mmlu_pro":1643,"benchmark_scicode":326,"benchmark_tau2":2945,"benchmark_terminalbench":3596,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4111,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3496,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":414,"benchmark_mmlu_pro_reasoning":1643,"benchmark_gpqa_reasoning":1066,"benchmark_aime_25_reasoning":887,"benchmark_hle_reasoning":2828,"benchmark_scicode_reasoning":326,"benchmark_ifbench_reasoning":1920,"benchmark_lcr_reasoning":3991,"benchmark_terminalbench_reasoning":1184,"benchmark_tau2_reasoning":569,"benchmark_intelligence":2337,"benchmark_intelligence_reasoning":1645,"benchmark_coding_reasoning":1644,"benchmark_math_reasoning":887},"d09b3091-396a-4ddd-8b32-6580486e124c","7decccab-2a1f-40c4-896d-beaee9bd9a21","Claude Opus 4.1 (Reasoning)","Claude 4.1 Opus (Reasoning)",35.356,8.769,55.400000000000006,83.4448,{"aa_id":4113,"ppt_model_id":4105,"slug":1639,"model_name":1640,"provider_name":138,"name":1640,"provider":138,"aa_name":4114,"is_open":11,"author_country":2653,"release_date":1642,"release_month":1635,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":161,"output_price_per_1m_tokens":1351,"input_price":161,"output_price":1351,"tokens_per_second":4115,"time_to_first_token":4116,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4111,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3496,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":414,"benchmark_mmlu_pro_reasoning":1643,"benchmark_gpqa_reasoning":1066,"benchmark_aime_25_reasoning":887,"benchmark_hle_reasoning":2828,"benchmark_scicode_reasoning":326,"benchmark_ifbench_reasoning":1920,"benchmark_lcr_reasoning":3991,"benchmark_terminalbench_reasoning":1184,"benchmark_tau2_reasoning":569,"benchmark_intelligence":2337,"benchmark_intelligence_reasoning":1645,"benchmark_coding_reasoning":1644,"benchmark_math_reasoning":887},"80890ad1-2139-4d02-90e4-15f8c58ba799","Claude 4.1 Opus (Non-reasoning)",34.685,1.563,{"aa_id":4118,"ppt_model_id":4119,"slug":1648,"model_name":1649,"provider_name":9,"name":1649,"provider":9,"aa_name":4120,"is_open":37,"author_country":2653,"release_date":1651,"release_month":1635,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":207,"output_price_per_1m_tokens":495,"input_price":207,"output_price":495,"tokens_per_second":4121,"time_to_first_token":4122,"benchmark_aime":12,"benchmark_aime_25":973,"benchmark_gpqa":1652,"benchmark_hle":2702,"benchmark_ifbench":4123,"benchmark_lcr":2896,"benchmark_livecodebench":1255,"benchmark_math_hard":12,"benchmark_mmlu_pro":767,"benchmark_scicode":2045,"benchmark_tau2":4124,"benchmark_terminalbench":2812,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4125,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4126,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":1158,"benchmark_math":973,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4127,"benchmark_coding":904},"31b375c1-718e-475d-83bf-3b98f61cbc5e","e8187451-bfc4-4c3a-99e8-8a29f106c9ac","gpt-oss-20B (high)",271.094,0.449,65.10000000000001,60.199999999999996,79.5678,84.0573,24.5,{"aa_id":4129,"ppt_model_id":4130,"slug":1655,"model_name":1656,"provider_name":9,"name":1656,"provider":9,"aa_name":4131,"is_open":37,"author_country":2653,"release_date":1658,"release_month":1635,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":1659,"output_price_per_1m_tokens":495,"input_price":1659,"output_price":495,"tokens_per_second":4132,"time_to_first_token":4133,"benchmark_aime":12,"benchmark_aime_25":1340,"benchmark_gpqa":1607,"benchmark_hle":904,"benchmark_ifbench":483,"benchmark_lcr":4134,"benchmark_livecodebench":4135,"benchmark_math_hard":12,"benchmark_mmlu_pro":3562,"benchmark_scicode":4136,"benchmark_tau2":4137,"benchmark_terminalbench":3092,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4138,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4139,"benchmark_bfcl_v3":12,"benchmark_bird_critic":4140,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3690,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":4141,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":1241,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1662,"benchmark_intelligence":4127,"benchmark_coding":3151},"e6191a58-b31e-45fc-9121-8070c710ae0c","da80cf0c-78c4-46e2-82c9-af9bb1547843","gpt-oss-120B (high)",228.141,0.509,50.7,87.8,38.9,65.8,82.718,82.1352,25.7627,87.6228,{"aa_id":4143,"ppt_model_id":4130,"slug":1655,"model_name":1656,"provider_name":9,"name":1656,"provider":9,"aa_name":4144,"is_open":37,"author_country":2653,"release_date":1658,"release_month":1635,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":1659,"output_price_per_1m_tokens":495,"input_price":1659,"output_price":495,"tokens_per_second":4145,"time_to_first_token":4146,"benchmark_aime":12,"benchmark_aime_25":3690,"benchmark_gpqa":1661,"benchmark_hle":2835,"benchmark_ifbench":4147,"benchmark_lcr":1136,"benchmark_livecodebench":1024,"benchmark_math_hard":12,"benchmark_mmlu_pro":1660,"benchmark_scicode":2337,"benchmark_tau2":4148,"benchmark_terminalbench":1146,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4138,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4139,"benchmark_bfcl_v3":12,"benchmark_bird_critic":4140,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3690,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":4141,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":1241,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1662,"benchmark_intelligence":4127,"benchmark_coding":3151},"3ab2f5ef-63ab-4e1a-b701-0cf8d2910537","gpt-oss-120B (low)",218.952,0.506,58.3,45,{"aa_id":4150,"ppt_model_id":4151,"slug":1665,"model_name":1666,"provider_name":9,"name":1666,"provider":9,"aa_name":4152,"is_open":11,"author_country":2653,"release_date":1668,"release_month":1635,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":536,"input_price":299,"output_price":536,"tokens_per_second":4153,"time_to_first_token":4154,"benchmark_aime":12,"benchmark_aime_25":891,"benchmark_gpqa":2778,"benchmark_hle":3300,"benchmark_ifbench":2778,"benchmark_lcr":2933,"benchmark_livecodebench":279,"benchmark_math_hard":12,"benchmark_mmlu_pro":1943,"benchmark_scicode":2906,"benchmark_tau2":1644,"benchmark_terminalbench":3245,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":4155,"benchmark_bbh":4156,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3777,"benchmark_mbppplus":3535,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1209,"benchmark_coding":1272},"e348b502-6b1f-4b25-a720-b047ac11525a","f729e7ab-69a2-402d-9a36-a4af8d2bbddb","GPT-5 nano (high)",145.396,83.794,29.292,86.881,{"aa_id":4158,"ppt_model_id":4151,"slug":1665,"model_name":1666,"provider_name":9,"name":1666,"provider":9,"aa_name":4159,"is_open":11,"author_country":2653,"release_date":1668,"release_month":1635,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":536,"input_price":299,"output_price":536,"tokens_per_second":4160,"time_to_first_token":4161,"benchmark_aime":12,"benchmark_aime_25":4162,"benchmark_gpqa":725,"benchmark_hle":3413,"benchmark_ifbench":1021,"benchmark_lcr":1201,"benchmark_livecodebench":1224,"benchmark_math_hard":12,"benchmark_mmlu_pro":511,"benchmark_scicode":4163,"benchmark_tau2":2860,"benchmark_terminalbench":1191,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":4155,"benchmark_bbh":4156,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3777,"benchmark_mbppplus":3535,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1209,"benchmark_coding":1272},"8e712a16-2bbe-4855-a5a7-516188efe42e","GPT-5 nano (medium)",141.965,45.267,78.3,33.800000000000004,{"aa_id":4165,"ppt_model_id":4151,"slug":1665,"model_name":1666,"provider_name":9,"name":1666,"provider":9,"aa_name":4166,"is_open":11,"author_country":2653,"release_date":1668,"release_month":1635,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":536,"input_price":299,"output_price":536,"tokens_per_second":4167,"time_to_first_token":4168,"benchmark_aime":12,"benchmark_aime_25":3777,"benchmark_gpqa":959,"benchmark_hle":2699,"benchmark_ifbench":1944,"benchmark_lcr":436,"benchmark_livecodebench":1219,"benchmark_math_hard":12,"benchmark_mmlu_pro":3554,"benchmark_scicode":2692,"benchmark_tau2":4169,"benchmark_terminalbench":2753,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":4155,"benchmark_bbh":4156,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3777,"benchmark_mbppplus":3535,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1209,"benchmark_coding":1272},"1b885110-1f86-4ecb-8294-18d840a66142","GPT-5 nano (minimal)",126.566,0.824,25.7,{"aa_id":4171,"ppt_model_id":4172,"slug":1672,"model_name":1673,"provider_name":9,"name":1673,"provider":9,"aa_name":4173,"is_open":11,"author_country":2653,"release_date":1675,"release_month":1635,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":1676,"output_price_per_1m_tokens":61,"input_price":1676,"output_price":61,"tokens_per_second":4174,"time_to_first_token":4175,"benchmark_aime":12,"benchmark_aime_25":1323,"benchmark_gpqa":1187,"benchmark_hle":2295,"benchmark_ifbench":4176,"benchmark_lcr":3117,"benchmark_livecodebench":1677,"benchmark_math_hard":12,"benchmark_mmlu_pro":891,"benchmark_scicode":2350,"benchmark_tau2":1598,"benchmark_terminalbench":3213,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4177,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":4178,"benchmark_bbh":4179,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":4180,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1323,"benchmark_mbppplus":3186,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4181,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4182,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4183,"benchmark_coding":4034},"2247f4b1-9f46-4b16-b141-b8fc750d8c5b","edb32b20-7b08-4e69-893e-4b4255fb1795","GPT-5 mini (high)",76.202,86.261,75.4,87.117,54.8894,87.7438,44.8485,75.3333,38.3333,41.2,{"aa_id":4185,"ppt_model_id":4186,"slug":1680,"model_name":1681,"provider_name":9,"name":1681,"provider":9,"aa_name":4187,"is_open":11,"author_country":2653,"release_date":1683,"release_month":1635,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":107,"output_price_per_1m_tokens":505,"input_price":107,"output_price":505,"tokens_per_second":4188,"time_to_first_token":4189,"benchmark_aime":943,"benchmark_aime_25":1502,"benchmark_gpqa":4190,"benchmark_hle":3411,"benchmark_ifbench":4191,"benchmark_lcr":4192,"benchmark_livecodebench":2347,"benchmark_math_hard":4193,"benchmark_mmlu_pro":1221,"benchmark_scicode":4194,"benchmark_tau2":1112,"benchmark_terminalbench":1111,"benchmark_accountingaudit":3190,"benchmark_agieval_zh":12,"benchmark_agieval_en":4195,"benchmark_arc_challenge":4196,"benchmark_arc_easy":12,"benchmark_bbeh":4197,"benchmark_bbh":4198,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":4199,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2096,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4200,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2924,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1643,"benchmark_intelligence":3641,"benchmark_coding":3412},"ebbf0fc5-d004-4f60-ab39-2449e3a340f5","9829faeb-73e7-46ff-b7be-bc158b920364","GPT-5 (high)",97.092,85.601,85.39999999999999,73.1,75.6,99.4,42.9,91.3983,96.3311,64.115,90.9356,94.8446,79.0541,{"aa_id":4202,"ppt_model_id":4186,"slug":1680,"model_name":1681,"provider_name":9,"name":1681,"provider":9,"aa_name":4203,"is_open":11,"author_country":2653,"release_date":1683,"release_month":1635,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":107,"output_price_per_1m_tokens":505,"input_price":107,"output_price":505,"tokens_per_second":4204,"time_to_first_token":2292,"benchmark_aime":2156,"benchmark_aime_25":2156,"benchmark_gpqa":513,"benchmark_hle":3092,"benchmark_ifbench":1627,"benchmark_lcr":4205,"benchmark_livecodebench":316,"benchmark_math_hard":1343,"benchmark_mmlu_pro":4206,"benchmark_scicode":4207,"benchmark_tau2":1861,"benchmark_terminalbench":198,"benchmark_accountingaudit":3190,"benchmark_agieval_zh":12,"benchmark_agieval_en":4195,"benchmark_arc_challenge":4196,"benchmark_arc_easy":12,"benchmark_bbeh":4197,"benchmark_bbh":4198,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":4199,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2096,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4200,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2924,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1643,"benchmark_intelligence":3641,"benchmark_coding":3412},"79b5eaf1-a41b-4322-bb89-2bc1e3ffc0da","GPT-5 (medium)",86.366,72.8,86.7,41.099999999999994,{"aa_id":4209,"ppt_model_id":4186,"slug":1680,"model_name":1681,"provider_name":9,"name":1681,"provider":9,"aa_name":4210,"is_open":11,"author_country":2653,"release_date":1683,"release_month":1635,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":107,"output_price_per_1m_tokens":505,"input_price":107,"output_price":505,"tokens_per_second":4211,"time_to_first_token":4212,"benchmark_aime":2393,"benchmark_aime_25":2393,"benchmark_gpqa":3562,"benchmark_hle":3475,"benchmark_ifbench":3525,"benchmark_lcr":3199,"benchmark_livecodebench":1224,"benchmark_math_hard":4213,"benchmark_mmlu_pro":871,"benchmark_scicode":3928,"benchmark_tau2":513,"benchmark_terminalbench":3411,"benchmark_accountingaudit":3190,"benchmark_agieval_zh":12,"benchmark_agieval_en":4195,"benchmark_arc_challenge":4196,"benchmark_arc_easy":12,"benchmark_bbeh":4197,"benchmark_bbh":4198,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":4199,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2096,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4200,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2924,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1643,"benchmark_intelligence":3641,"benchmark_coding":3412},"aa00917f-4148-45dd-9b88-a40c527389aa","GPT-5 (low)",77.859,7.238,98.7,{"aa_id":4215,"ppt_model_id":4186,"slug":1680,"model_name":1681,"provider_name":9,"name":1681,"provider":9,"aa_name":4216,"is_open":11,"author_country":2653,"release_date":1683,"release_month":1635,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":107,"output_price_per_1m_tokens":505,"input_price":107,"output_price":505,"tokens_per_second":4217,"time_to_first_token":4218,"benchmark_aime":1686,"benchmark_aime_25":2096,"benchmark_gpqa":4070,"benchmark_hle":4219,"benchmark_ifbench":4220,"benchmark_lcr":174,"benchmark_livecodebench":4221,"benchmark_math_hard":1685,"benchmark_mmlu_pro":3526,"benchmark_scicode":3301,"benchmark_tau2":725,"benchmark_terminalbench":4222,"benchmark_accountingaudit":3190,"benchmark_agieval_zh":12,"benchmark_agieval_en":4195,"benchmark_arc_challenge":4196,"benchmark_arc_easy":12,"benchmark_bbeh":4197,"benchmark_bbh":4198,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":4199,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2096,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4200,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2924,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1643,"benchmark_intelligence":3641,"benchmark_coding":3412},"78c2f890-aa5d-4399-9ab9-be68916ff829","GPT-5 (minimal)",66.995,1.006,5.4,45.6,55.800000000000004,18.2,{"aa_id":4224,"ppt_model_id":4225,"slug":1695,"model_name":1696,"provider_name":4226,"name":1696,"provider":4226,"aa_name":4227,"is_open":11,"author_country":4228,"release_date":1699,"release_month":1635,"context_length":981,"inference_mode":2654,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":615,"input_price":78,"output_price":615,"tokens_per_second":4229,"time_to_first_token":4230,"benchmark_aime":230,"benchmark_aime_25":363,"benchmark_gpqa":1071,"benchmark_hle":2934,"benchmark_ifbench":4231,"benchmark_lcr":2775,"benchmark_livecodebench":3702,"benchmark_math_hard":17,"benchmark_mmlu_pro":4232,"benchmark_scicode":361,"benchmark_tau2":3005,"benchmark_terminalbench":363,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":363,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1712,"benchmark_coding":4233},"682b9f16-63e9-4f2b-aee4-d1d944825d83","27f1a079-c301-4647-9f15-2837cdd20f45","AI21 Labs","Jamba 1.7 Large","il",55.279,0.737,35.199999999999996,57.699999999999996,7.8,{"aa_id":4235,"ppt_model_id":4236,"slug":1704,"model_name":4237,"provider_name":4066,"name":1705,"provider":4066,"aa_name":4238,"is_open":37,"author_country":2653,"release_date":1707,"release_month":1635,"context_length":181,"inference_mode":3250,"input_price_per_1m_tokens":274,"output_price_per_1m_tokens":1708,"input_price":274,"output_price":1708,"tokens_per_second":4239,"time_to_first_token":4240,"benchmark_aime":12,"benchmark_aime_25":1211,"benchmark_gpqa":1598,"benchmark_hle":3691,"benchmark_ifbench":4241,"benchmark_lcr":2667,"benchmark_livecodebench":768,"benchmark_math_hard":12,"benchmark_mmlu_pro":1571,"benchmark_scicode":447,"benchmark_tau2":4242,"benchmark_terminalbench":1146,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1260,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":768,"benchmark_mmlu_pro_reasoning":1571,"benchmark_gpqa_reasoning":1598,"benchmark_aime_25_reasoning":1211,"benchmark_hle_reasoning":4243,"benchmark_scicode_reasoning":447,"benchmark_ifbench_reasoning":4241,"benchmark_lcr_reasoning":2667,"benchmark_terminalbench_reasoning":1146,"benchmark_tau2_reasoning":4242,"benchmark_intelligence":3046,"benchmark_coding":2900,"benchmark_intelligence_reasoning":1713,"benchmark_coding_reasoning":1712,"benchmark_math_reasoning":1211},"5f768b47-797b-43c9-a536-3ad24c0590c6","91f39b7b-638d-4460-a462-f92015000df4","GLM 4.5V (Reasoning)","GLM-4.5V (Reasoning)",49.31,1.091,34.2,22.5,5.9,{"aa_id":4245,"ppt_model_id":4236,"slug":1704,"model_name":1705,"provider_name":4066,"name":1705,"provider":4066,"aa_name":4246,"is_open":37,"author_country":2653,"release_date":1707,"release_month":1635,"context_length":181,"inference_mode":2654,"input_price_per_1m_tokens":274,"output_price_per_1m_tokens":1708,"input_price":274,"output_price":1708,"tokens_per_second":4247,"time_to_first_token":4248,"benchmark_aime":12,"benchmark_aime_25":3206,"benchmark_gpqa":1710,"benchmark_hle":2943,"benchmark_ifbench":2789,"benchmark_lcr":2667,"benchmark_livecodebench":4231,"benchmark_math_hard":12,"benchmark_mmlu_pro":1709,"benchmark_scicode":361,"benchmark_tau2":437,"benchmark_terminalbench":2753,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1260,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":768,"benchmark_mmlu_pro_reasoning":1571,"benchmark_gpqa_reasoning":1598,"benchmark_aime_25_reasoning":1211,"benchmark_hle_reasoning":4243,"benchmark_scicode_reasoning":447,"benchmark_ifbench_reasoning":4241,"benchmark_lcr_reasoning":2667,"benchmark_terminalbench_reasoning":1146,"benchmark_tau2_reasoning":4242,"benchmark_intelligence":3046,"benchmark_coding":2900,"benchmark_intelligence_reasoning":1713,"benchmark_coding_reasoning":1712,"benchmark_math_reasoning":1211},"b3cec8ea-6db8-4fbf-94c6-31e4f8bd35f7","GLM-4.5V (Non-reasoning)",51.346,17.178,{"aa_id":4250,"ppt_model_id":4251,"slug":1731,"model_name":1732,"provider_name":2665,"name":1732,"provider":2665,"aa_name":1732,"is_open":11,"author_country":2666,"release_date":1734,"release_month":1635,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":78,"input_price":536,"output_price":78,"tokens_per_second":4252,"time_to_first_token":4253,"benchmark_aime":12,"benchmark_aime_25":388,"benchmark_gpqa":1735,"benchmark_hle":2710,"benchmark_ifbench":3238,"benchmark_lcr":2295,"benchmark_livecodebench":1239,"benchmark_math_hard":12,"benchmark_mmlu_pro":2965,"benchmark_scicode":4163,"benchmark_tau2":1239,"benchmark_terminalbench":2812,"benchmark_accountingaudit":12,"benchmark_agieval_zh":4254,"benchmark_agieval_en":4255,"benchmark_arc_challenge":3441,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4256,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":4257,"benchmark_gsm8k":12,"benchmark_humaneval":4258,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":388,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4259,"benchmark_multichallenge":4260,"benchmark_simpleqa":4261,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4262,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":317,"benchmark_coding":3388},"08705411-1008-4a50-b1ea-a2005731765e","4e940cfd-9acd-4fec-b1bf-9f6d5cfb8058",63.477,0.414,74.1685,71.8775,80.4945,23.3083,88.4146,58.1111,37.3626,20.5039,36.4548,{"aa_id":4264,"ppt_model_id":4265,"slug":1738,"model_name":1739,"provider_name":3115,"name":1739,"provider":3115,"aa_name":4266,"is_open":37,"author_country":2817,"release_date":1741,"release_month":1635,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":60,"input_price":273,"output_price":60,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":2199,"benchmark_gpqa":1743,"benchmark_hle":1004,"benchmark_ifbench":3892,"benchmark_lcr":4148,"benchmark_livecodebench":4232,"benchmark_math_hard":12,"benchmark_mmlu_pro":1742,"benchmark_scicode":1686,"benchmark_tau2":3429,"benchmark_terminalbench":4267,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4268,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":4269,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2199,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":4270,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4271,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1155,"benchmark_mmlu_pro_reasoning":1744,"benchmark_gpqa_reasoning":857,"benchmark_aime_25_reasoning":1745,"benchmark_hle_reasoning":880,"benchmark_scicode_reasoning":3928,"benchmark_ifbench_reasoning":3665,"benchmark_lcr_reasoning":1079,"benchmark_terminalbench_reasoning":174,"benchmark_tau2_reasoning":145,"benchmark_intelligence":3366,"benchmark_coding":3961,"benchmark_intelligence_reasoning":906,"benchmark_coding_reasoning":28,"benchmark_math_reasoning":1745},"8c02b4b8-17a9-4d10-8a49-0b8f7c1bd66b","e259e725-015c-4294-8fec-a441b8e4e065","DeepSeek V3.1 (Non-reasoning)",24.2,79.7722,11.5152,23.2779,14.3333,{"aa_id":4273,"ppt_model_id":4265,"slug":1738,"model_name":4274,"provider_name":3115,"name":1739,"provider":3115,"aa_name":4274,"is_open":37,"author_country":2817,"release_date":1741,"release_month":1635,"context_length":115,"inference_mode":3250,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":60,"input_price":273,"output_price":60,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":1745,"benchmark_gpqa":857,"benchmark_hle":880,"benchmark_ifbench":3665,"benchmark_lcr":4030,"benchmark_livecodebench":1155,"benchmark_math_hard":12,"benchmark_mmlu_pro":1744,"benchmark_scicode":3928,"benchmark_tau2":145,"benchmark_terminalbench":174,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4268,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":4269,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2199,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":4270,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4271,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1155,"benchmark_mmlu_pro_reasoning":1744,"benchmark_gpqa_reasoning":857,"benchmark_aime_25_reasoning":1745,"benchmark_hle_reasoning":880,"benchmark_scicode_reasoning":3928,"benchmark_ifbench_reasoning":3665,"benchmark_lcr_reasoning":1079,"benchmark_terminalbench_reasoning":174,"benchmark_tau2_reasoning":145,"benchmark_intelligence":3366,"benchmark_coding":3961,"benchmark_intelligence_reasoning":906,"benchmark_coding_reasoning":28,"benchmark_math_reasoning":1745},"40635922-8173-46cc-9d1e-cb913a8801e6","DeepSeek V3.1 (Reasoning)",{"aa_id":4276,"ppt_model_id":4277,"slug":1748,"model_name":4278,"provider_name":2802,"name":1749,"provider":2802,"aa_name":4279,"is_open":37,"author_country":2653,"release_date":1751,"release_month":1635,"context_length":287,"inference_mode":3250,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":68,"input_price":61,"output_price":68,"tokens_per_second":4280,"time_to_first_token":4281,"benchmark_aime":12,"benchmark_aime_25":2974,"benchmark_gpqa":1200,"benchmark_hle":2944,"benchmark_ifbench":1186,"benchmark_lcr":3337,"benchmark_livecodebench":4282,"benchmark_math_hard":12,"benchmark_mmlu_pro":4283,"benchmark_scicode":757,"benchmark_tau2":1420,"benchmark_terminalbench":3121,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":4284,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":4285,"benchmark_knights_and_knaves":12,"benchmark_math":1260,"benchmark_mbppplus":12,"benchmark_medqa":4286,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1754,"benchmark_mmlu_pro_reasoning":1753,"benchmark_gpqa_reasoning":1200,"benchmark_aime_25_reasoning":587,"benchmark_hle_reasoning":3029,"benchmark_scicode_reasoning":757,"benchmark_ifbench_reasoning":1186,"benchmark_lcr_reasoning":3337,"benchmark_terminalbench_reasoning":3121,"benchmark_tau2_reasoning":1420,"benchmark_intelligence":1556,"benchmark_coding":1701,"benchmark_intelligence_reasoning":1755,"benchmark_coding_reasoning":417,"benchmark_math_reasoning":587},"2276f7af-e1c3-4240-8ee7-b50a49e8b578","2660c652-4361-4c58-9341-afc7132bcdc3","Hermes 4 405B (Reasoning)","Hermes 4 - Llama-3.1 405B (Reasoning)",33.865,0.729,68.60000000000001,82.89999999999999,11.1504,75.4159,72.8201,{"aa_id":4288,"ppt_model_id":4277,"slug":1748,"model_name":1749,"provider_name":2802,"name":1749,"provider":2802,"aa_name":4289,"is_open":37,"author_country":2653,"release_date":1751,"release_month":1635,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":68,"input_price":61,"output_price":68,"tokens_per_second":4290,"time_to_first_token":4291,"benchmark_aime":12,"benchmark_aime_25":3206,"benchmark_gpqa":1752,"benchmark_hle":2752,"benchmark_ifbench":3429,"benchmark_lcr":436,"benchmark_livecodebench":1206,"benchmark_math_hard":12,"benchmark_mmlu_pro":4292,"benchmark_scicode":3960,"benchmark_tau2":723,"benchmark_terminalbench":2702,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":4284,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":4285,"benchmark_knights_and_knaves":12,"benchmark_math":1260,"benchmark_mbppplus":12,"benchmark_medqa":4286,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1754,"benchmark_mmlu_pro_reasoning":1753,"benchmark_gpqa_reasoning":1200,"benchmark_aime_25_reasoning":587,"benchmark_hle_reasoning":3029,"benchmark_scicode_reasoning":757,"benchmark_ifbench_reasoning":1186,"benchmark_lcr_reasoning":3337,"benchmark_terminalbench_reasoning":3121,"benchmark_tau2_reasoning":1420,"benchmark_intelligence":1556,"benchmark_coding":1701,"benchmark_intelligence_reasoning":1755,"benchmark_coding_reasoning":417,"benchmark_math_reasoning":587},"059cd54e-f613-4e94-a80d-2d84e65fd491","Hermes 4 - Llama-3.1 405B (Non-reasoning)",35.642,0.717,72.89999999999999,{"aa_id":4294,"ppt_model_id":4295,"slug":1758,"model_name":4296,"provider_name":2802,"name":1759,"provider":2802,"aa_name":4297,"is_open":37,"author_country":2653,"release_date":1761,"release_month":1635,"context_length":287,"inference_mode":3250,"input_price_per_1m_tokens":808,"output_price_per_1m_tokens":536,"input_price":808,"output_price":536,"tokens_per_second":4298,"time_to_first_token":4299,"benchmark_aime":12,"benchmark_aime_25":749,"benchmark_gpqa":4300,"benchmark_hle":3325,"benchmark_ifbench":3239,"benchmark_lcr":429,"benchmark_livecodebench":1764,"benchmark_math_hard":12,"benchmark_mmlu_pro":3927,"benchmark_scicode":1344,"benchmark_tau2":4242,"benchmark_terminalbench":545,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":4301,"benchmark_knights_and_knaves":12,"benchmark_math":4302,"benchmark_mbppplus":12,"benchmark_medqa":4303,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1764,"benchmark_mmlu_pro_reasoning":1453,"benchmark_gpqa_reasoning":1763,"benchmark_aime_25_reasoning":749,"benchmark_hle_reasoning":3325,"benchmark_scicode_reasoning":1344,"benchmark_ifbench_reasoning":3239,"benchmark_lcr_reasoning":429,"benchmark_terminalbench_reasoning":545,"benchmark_tau2_reasoning":4242,"benchmark_intelligence":1144,"benchmark_coding":4304,"benchmark_intelligence_reasoning":417,"benchmark_coding_reasoning":1765,"benchmark_math_reasoning":749},"58f78d8c-7b6f-4d13-b9c6-2e17e3c90a33","d3fda04f-325e-407c-b011-5b8dd68e747e","Hermes 4 70B (Reasoning)","Hermes 4 - Llama-3.1 70B (Reasoning)",82.828,0.592,69.89999999999999,68.5767,11.3,70.0707,9.2,{"aa_id":4306,"ppt_model_id":4295,"slug":1758,"model_name":1759,"provider_name":2802,"name":1759,"provider":2802,"aa_name":4307,"is_open":37,"author_country":2653,"release_date":1761,"release_month":1635,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":808,"output_price_per_1m_tokens":536,"input_price":808,"output_price":536,"tokens_per_second":4308,"time_to_first_token":4309,"benchmark_aime":12,"benchmark_aime_25":4302,"benchmark_gpqa":413,"benchmark_hle":2943,"benchmark_ifbench":3299,"benchmark_lcr":78,"benchmark_livecodebench":4310,"benchmark_math_hard":12,"benchmark_mmlu_pro":1121,"benchmark_scicode":3292,"benchmark_tau2":1899,"benchmark_terminalbench":2667,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":4301,"benchmark_knights_and_knaves":12,"benchmark_math":4302,"benchmark_mbppplus":12,"benchmark_medqa":4303,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1764,"benchmark_mmlu_pro_reasoning":1453,"benchmark_gpqa_reasoning":1763,"benchmark_aime_25_reasoning":749,"benchmark_hle_reasoning":3325,"benchmark_scicode_reasoning":1344,"benchmark_ifbench_reasoning":3239,"benchmark_lcr_reasoning":429,"benchmark_terminalbench_reasoning":545,"benchmark_tau2_reasoning":4242,"benchmark_intelligence":1144,"benchmark_coding":4304,"benchmark_intelligence_reasoning":417,"benchmark_coding_reasoning":1765,"benchmark_math_reasoning":749},"767f6f04-03e7-4a06-8922-e14dce7137f5","Hermes 4 - Llama-3.1 70B (Non-reasoning)",80.423,0.548,26.900000000000002,{"aa_id":4312,"ppt_model_id":4313,"slug":1768,"model_name":1769,"provider_name":3823,"name":1769,"provider":3823,"aa_name":1769,"is_open":11,"author_country":2653,"release_date":1771,"release_month":1635,"context_length":981,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":26,"input_price":377,"output_price":26,"tokens_per_second":4314,"time_to_first_token":4315,"benchmark_aime":12,"benchmark_aime_25":624,"benchmark_gpqa":1200,"benchmark_hle":99,"benchmark_ifbench":1510,"benchmark_lcr":201,"benchmark_livecodebench":1108,"benchmark_math_hard":12,"benchmark_mmlu_pro":1772,"benchmark_scicode":4316,"benchmark_tau2":1356,"benchmark_terminalbench":1191,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":624,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":983,"benchmark_coding":1113},"9de52516-4c02-4a68-924f-c6ab64986230","83f921d7-a506-4b80-bf69-8ef01d913f54",171.744,3.029,36.199999999999996,{"aa_id":4318,"ppt_model_id":4319,"slug":1781,"model_name":1782,"provider_name":3988,"name":1782,"provider":3988,"aa_name":4320,"is_open":37,"author_country":2817,"release_date":1784,"release_month":1785,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":78,"input_price":536,"output_price":78,"tokens_per_second":4321,"time_to_first_token":4322,"benchmark_aime":12,"benchmark_aime_25":1710,"benchmark_gpqa":557,"benchmark_hle":1004,"benchmark_ifbench":2933,"benchmark_lcr":3118,"benchmark_livecodebench":1786,"benchmark_math_hard":12,"benchmark_mmlu_pro":3365,"benchmark_scicode":2896,"benchmark_tau2":869,"benchmark_terminalbench":3092,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4323,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4324,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1710,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2166,"benchmark_coding":301},"361c9538-889f-40b4-8afb-adcb230d6910","23151d75-d40a-4837-8ce4-cf07a940e054","Kimi K2 0905",39.843,0.816,80.6921,86.6994,{"aa_id":4326,"ppt_model_id":4327,"slug":1789,"model_name":4328,"provider_name":2892,"name":1790,"provider":2892,"aa_name":4329,"is_open":37,"author_country":2653,"release_date":1792,"release_month":1785,"context_length":287,"inference_mode":3250,"input_price_per_1m_tokens":208,"output_price_per_1m_tokens":957,"input_price":208,"output_price":957,"tokens_per_second":4330,"time_to_first_token":4331,"benchmark_aime":12,"benchmark_aime_25":2974,"benchmark_gpqa":4004,"benchmark_hle":2776,"benchmark_ifbench":415,"benchmark_lcr":2683,"benchmark_livecodebench":3293,"benchmark_math_hard":12,"benchmark_mmlu_pro":1793,"benchmark_scicode":995,"benchmark_tau2":3143,"benchmark_terminalbench":26,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":858,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":902,"benchmark_mmlu_pro_reasoning":1793,"benchmark_gpqa_reasoning":1794,"benchmark_aime_25_reasoning":587,"benchmark_hle_reasoning":2776,"benchmark_scicode_reasoning":995,"benchmark_ifbench_reasoning":415,"benchmark_lcr_reasoning":2683,"benchmark_terminalbench_reasoning":26,"benchmark_tau2_reasoning":3143,"benchmark_intelligence":1242,"benchmark_coding":99,"benchmark_intelligence_reasoning":185,"benchmark_coding_reasoning":427,"benchmark_math_reasoning":587},"b6f43e02-6fee-4ce2-a720-7bd6168b3c7a","e46c3999-04d5-45a0-9fe1-c7136f4465d0","Nemotron Nano 9B V2 (Reasoning)","NVIDIA Nemotron Nano 9B V2 (Reasoning)",158.685,0.193,{"aa_id":4333,"ppt_model_id":4327,"slug":1789,"model_name":1790,"provider_name":2892,"name":1790,"provider":2892,"aa_name":4334,"is_open":37,"author_country":2653,"release_date":1792,"release_month":1785,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":208,"output_price_per_1m_tokens":957,"input_price":208,"output_price":957,"tokens_per_second":4335,"time_to_first_token":4336,"benchmark_aime":12,"benchmark_aime_25":858,"benchmark_gpqa":915,"benchmark_hle":69,"benchmark_ifbench":2935,"benchmark_lcr":4094,"benchmark_livecodebench":566,"benchmark_math_hard":12,"benchmark_mmlu_pro":745,"benchmark_scicode":3898,"benchmark_tau2":2744,"benchmark_terminalbench":524,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":858,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":902,"benchmark_mmlu_pro_reasoning":1793,"benchmark_gpqa_reasoning":1794,"benchmark_aime_25_reasoning":587,"benchmark_hle_reasoning":2776,"benchmark_scicode_reasoning":995,"benchmark_ifbench_reasoning":415,"benchmark_lcr_reasoning":2683,"benchmark_terminalbench_reasoning":26,"benchmark_tau2_reasoning":3143,"benchmark_intelligence":1242,"benchmark_coding":99,"benchmark_intelligence_reasoning":185,"benchmark_coding_reasoning":427,"benchmark_math_reasoning":587},"cd62c847-30bc-4471-a1a7-dea9e7faef84","NVIDIA Nemotron Nano 9B V2 (Non-reasoning)",165.734,0.843,{"aa_id":4338,"ppt_model_id":4339,"slug":1810,"model_name":1811,"provider_name":1833,"name":1811,"provider":1833,"aa_name":1811,"is_open":37,"author_country":2817,"release_date":1813,"release_month":1785,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":404,"output_price_per_1m_tokens":794,"input_price":404,"output_price":794,"tokens_per_second":4340,"time_to_first_token":4341,"benchmark_aime":12,"benchmark_aime_25":3991,"benchmark_gpqa":1608,"benchmark_hle":3148,"benchmark_ifbench":1069,"benchmark_lcr":4031,"benchmark_livecodebench":1598,"benchmark_math_hard":12,"benchmark_mmlu_pro":3365,"benchmark_scicode":2896,"benchmark_tau2":1899,"benchmark_terminalbench":3413,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3991,"benchmark_mbppplus":3186,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":4342,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4343,"benchmark_coding":1260},"bf04d158-eb24-437d-b7c0-196ef0ccd433","ed0c7392-c8de-490f-b11b-8ee2b14bec3e",166.56,0.971,40.1294,20.1,{"aa_id":12,"ppt_model_id":4345,"slug":1831,"model_name":1832,"provider_name":1833,"name":1832,"provider":1833,"aa_name":12,"is_open":37,"author_country":2817,"release_date":1835,"release_month":1785,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":404,"output_price_per_1m_tokens":536,"input_price":404,"output_price":536,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4346,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":4347,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":4348,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12},"d3b02fa0-cf7a-4cf9-81d2-338006b1b311",84.8247,20.625,11.8613,{"aa_id":4350,"ppt_model_id":4351,"slug":1838,"model_name":4352,"provider_name":3823,"name":1839,"provider":3823,"aa_name":4352,"is_open":11,"author_country":2653,"release_date":1841,"release_month":1785,"context_length":1842,"inference_mode":3250,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":25,"input_price":377,"output_price":25,"tokens_per_second":4353,"time_to_first_token":4354,"benchmark_aime":12,"benchmark_aime_25":1745,"benchmark_gpqa":1844,"benchmark_hle":2098,"benchmark_ifbench":567,"benchmark_lcr":3759,"benchmark_livecodebench":1154,"benchmark_math_hard":12,"benchmark_mmlu_pro":889,"benchmark_scicode":2497,"benchmark_tau2":4137,"benchmark_terminalbench":2711,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4355,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4356,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3926,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4357,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":570,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1154,"benchmark_mmlu_pro_reasoning":889,"benchmark_gpqa_reasoning":1844,"benchmark_aime_25_reasoning":1745,"benchmark_hle_reasoning":2098,"benchmark_scicode_reasoning":2497,"benchmark_ifbench_reasoning":567,"benchmark_lcr_reasoning":3759,"benchmark_terminalbench_reasoning":2711,"benchmark_tau2_reasoning":4137,"benchmark_intelligence":689,"benchmark_coding":1243,"benchmark_intelligence_reasoning":131,"benchmark_coding_reasoning":1845,"benchmark_math_reasoning":1745},"84ae7f99-97f8-444f-a91e-ecac4cc579f5","ab77382c-ccd4-43f2-8f43-d147e72c6383","Grok 4 Fast (Reasoning)",144.879,4.004,88.8845,89.3258,60.4444,{"aa_id":4359,"ppt_model_id":4351,"slug":1838,"model_name":1839,"provider_name":3823,"name":1839,"provider":3823,"aa_name":4360,"is_open":11,"author_country":2653,"release_date":1841,"release_month":1785,"context_length":1842,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":25,"input_price":377,"output_price":25,"tokens_per_second":4361,"time_to_first_token":3157,"benchmark_aime":12,"benchmark_aime_25":3926,"benchmark_gpqa":1843,"benchmark_hle":505,"benchmark_ifbench":3692,"benchmark_lcr":436,"benchmark_livecodebench":360,"benchmark_math_hard":12,"benchmark_mmlu_pro":1211,"benchmark_scicode":1923,"benchmark_tau2":2163,"benchmark_terminalbench":3245,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4362,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4363,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3926,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1154,"benchmark_mmlu_pro_reasoning":889,"benchmark_gpqa_reasoning":1844,"benchmark_aime_25_reasoning":1745,"benchmark_hle_reasoning":2098,"benchmark_scicode_reasoning":2497,"benchmark_ifbench_reasoning":567,"benchmark_lcr_reasoning":3759,"benchmark_terminalbench_reasoning":2711,"benchmark_tau2_reasoning":4137,"benchmark_intelligence":689,"benchmark_coding":1243,"benchmark_intelligence_reasoning":131,"benchmark_coding_reasoning":1845,"benchmark_math_reasoning":1745},"afcd525f-9d02-4b2b-8b19-3f3f243749ca","Grok 4 Fast (Non-reasoning)",131.013,88.6489,89.6483,{"aa_id":4365,"ppt_model_id":4366,"slug":1848,"model_name":4367,"provider_name":3115,"name":1849,"provider":3115,"aa_name":4367,"is_open":37,"author_country":2817,"release_date":1851,"release_month":1785,"context_length":670,"inference_mode":3250,"input_price_per_1m_tokens":1852,"output_price_per_1m_tokens":1853,"input_price":1852,"output_price":1853,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":1745,"benchmark_gpqa":1854,"benchmark_hle":1986,"benchmark_ifbench":4004,"benchmark_lcr":4368,"benchmark_livecodebench":3604,"benchmark_math_hard":12,"benchmark_mmlu_pro":1744,"benchmark_scicode":1239,"benchmark_tau2":2022,"benchmark_terminalbench":1203,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4369,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4370,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":183,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1204,"benchmark_mmlu_pro_reasoning":1744,"benchmark_gpqa_reasoning":1854,"benchmark_aime_25_reasoning":1745,"benchmark_hle_reasoning":1986,"benchmark_scicode_reasoning":1239,"benchmark_ifbench_reasoning":1794,"benchmark_lcr_reasoning":4368,"benchmark_terminalbench_reasoning":1203,"benchmark_tau2_reasoning":2022,"benchmark_intelligence":3678,"benchmark_coding":3865,"benchmark_intelligence_reasoning":1143,"benchmark_coding_reasoning":917,"benchmark_math_reasoning":1745},"598db0b6-bee6-43d5-b1e6-c16363f40634","e509f593-273b-4b8b-8dbb-9b5f56732663","DeepSeek V3.1 Terminus (Reasoning)",65,84.7151,60.4669,{"aa_id":4372,"ppt_model_id":4366,"slug":1848,"model_name":1849,"provider_name":3115,"name":1849,"provider":3115,"aa_name":4373,"is_open":37,"author_country":2817,"release_date":1851,"release_month":1785,"context_length":670,"inference_mode":2654,"input_price_per_1m_tokens":1852,"output_price_per_1m_tokens":1853,"input_price":1852,"output_price":1853,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":183,"benchmark_gpqa":1709,"benchmark_hle":4374,"benchmark_ifbench":3891,"benchmark_lcr":624,"benchmark_livecodebench":3358,"benchmark_math_hard":12,"benchmark_mmlu_pro":1375,"benchmark_scicode":3847,"benchmark_tau2":2022,"benchmark_terminalbench":2349,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4369,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4370,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":183,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1204,"benchmark_mmlu_pro_reasoning":1744,"benchmark_gpqa_reasoning":1854,"benchmark_aime_25_reasoning":1745,"benchmark_hle_reasoning":1986,"benchmark_scicode_reasoning":1239,"benchmark_ifbench_reasoning":1794,"benchmark_lcr_reasoning":4368,"benchmark_terminalbench_reasoning":1203,"benchmark_tau2_reasoning":2022,"benchmark_intelligence":3678,"benchmark_coding":3865,"benchmark_intelligence_reasoning":1143,"benchmark_coding_reasoning":917,"benchmark_math_reasoning":1745},"8716feea-dc5d-454d-98cc-c1713c89b7fe","DeepSeek V3.1 Terminus (Non-reasoning)",8.4,{"aa_id":4376,"ppt_model_id":4377,"slug":1857,"model_name":1858,"provider_name":9,"name":1858,"provider":9,"aa_name":4378,"is_open":11,"author_country":2653,"release_date":1860,"release_month":1785,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":144,"output_price_per_1m_tokens":156,"input_price":144,"output_price":156,"tokens_per_second":4379,"time_to_first_token":4380,"benchmark_aime":12,"benchmark_aime_25":4213,"benchmark_gpqa":891,"benchmark_hle":3555,"benchmark_ifbench":2339,"benchmark_lcr":483,"benchmark_livecodebench":1190,"benchmark_math_hard":12,"benchmark_mmlu_pro":1861,"benchmark_scicode":326,"benchmark_tau2":2348,"benchmark_terminalbench":198,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":4213,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4381,"benchmark_coding":4136},"a065b939-8c45-4c91-9bd5-13cc520dba5b","428b287e-a32e-48f1-9a96-0371e6f7a0f8","GPT-5 Codex (high)",161.538,6.957,44.6,{"aa_id":4383,"ppt_model_id":4384,"slug":1871,"model_name":1872,"provider_name":1833,"name":1872,"provider":1833,"aa_name":1872,"is_open":11,"author_country":2817,"release_date":1874,"release_month":1785,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":794,"output_price_per_1m_tokens":1875,"input_price":794,"output_price":1875,"tokens_per_second":4385,"time_to_first_token":4386,"benchmark_aime":12,"benchmark_aime_25":1208,"benchmark_gpqa":1876,"benchmark_hle":1636,"benchmark_ifbench":30,"benchmark_lcr":1454,"benchmark_livecodebench":557,"benchmark_math_hard":12,"benchmark_mmlu_pro":652,"benchmark_scicode":388,"benchmark_tau2":1237,"benchmark_terminalbench":3061,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":12,"benchmark_agieval_en":3729,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4387,"benchmark_bfcl_v3":4388,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1351,"benchmark_mbppplus":12,"benchmark_medqa":4389,"benchmark_mmlu":12,"benchmark_mmmu":4390,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":568,"benchmark_coding":426},"6895b9be-4765-40ce-aa8f-f3374ad3c065","6527c4b8-0b63-4794-b99f-920da57f1a50",32.766,1.857,92.5664,74.8705,85.4674,57.4444,{"aa_id":4392,"ppt_model_id":4384,"slug":1871,"model_name":1872,"provider_name":1833,"name":1872,"provider":1833,"aa_name":4393,"is_open":11,"author_country":2817,"release_date":1874,"release_month":1785,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":794,"output_price_per_1m_tokens":1875,"input_price":794,"output_price":1875,"tokens_per_second":4394,"time_to_first_token":4395,"benchmark_aime":12,"benchmark_aime_25":1351,"benchmark_gpqa":1876,"benchmark_hle":450,"benchmark_ifbench":4396,"benchmark_lcr":1069,"benchmark_livecodebench":4123,"benchmark_math_hard":12,"benchmark_mmlu_pro":1677,"benchmark_scicode":4397,"benchmark_tau2":1186,"benchmark_terminalbench":2295,"benchmark_accountingaudit":2796,"benchmark_agieval_zh":12,"benchmark_agieval_en":3729,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4387,"benchmark_bfcl_v3":4388,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1351,"benchmark_mbppplus":12,"benchmark_medqa":4389,"benchmark_mmlu":12,"benchmark_mmmu":4390,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":568,"benchmark_coding":426},"a240bdd0-0bce-4f6e-a4af-90a2755127d5","Qwen3 Max (Preview)",41.034,1.735,48,37,{"aa_id":4399,"ppt_model_id":4400,"slug":1880,"model_name":1881,"provider_name":1833,"name":1881,"provider":1833,"aa_name":1881,"is_open":37,"author_country":2817,"release_date":1883,"release_month":1785,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":1884,"input_price":377,"output_price":1884,"tokens_per_second":4401,"time_to_first_token":4402,"benchmark_aime":12,"benchmark_aime_25":1024,"benchmark_gpqa":982,"benchmark_hle":1004,"benchmark_ifbench":4403,"benchmark_lcr":2096,"benchmark_livecodebench":636,"benchmark_math_hard":12,"benchmark_mmlu_pro":1419,"benchmark_scicode":784,"benchmark_tau2":2674,"benchmark_terminalbench":2753,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4404,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1024,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4405,"benchmark_multichallenge":12,"benchmark_simpleqa":4406,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2676,"benchmark_coding":1210},"d824b865-b8cd-499e-8203-164d4e6d0594","6d91ae14-b728-418b-a5aa-a11b119c3f32",57.514,1.051,42.699999999999996,80.7148,68.1514,46.6667,{"aa_id":12,"ppt_model_id":4408,"slug":1887,"model_name":1888,"provider_name":375,"name":1888,"provider":375,"aa_name":12,"is_open":37,"author_country":2817,"release_date":1890,"release_month":1785,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":793,"output_price_per_1m_tokens":312,"input_price":793,"output_price":312,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":4409,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12},"f55630ea-8e61-4068-b933-847cf24caa6c",37.8648,{"aa_id":4411,"ppt_model_id":4412,"slug":1893,"model_name":4413,"provider_name":248,"name":1894,"provider":248,"aa_name":4414,"is_open":11,"author_country":2653,"release_date":1896,"release_month":1785,"context_length":856,"inference_mode":3250,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":536,"input_price":495,"output_price":536,"tokens_per_second":4415,"time_to_first_token":4416,"benchmark_aime":12,"benchmark_aime_25":749,"benchmark_gpqa":4417,"benchmark_hle":2668,"benchmark_ifbench":4418,"benchmark_lcr":623,"benchmark_livecodebench":1652,"benchmark_math_hard":12,"benchmark_mmlu_pro":3562,"benchmark_scicode":983,"benchmark_tau2":2896,"benchmark_terminalbench":2936,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1454,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1652,"benchmark_mmlu_pro_reasoning":1167,"benchmark_gpqa_reasoning":1898,"benchmark_aime_25_reasoning":749,"benchmark_hle_reasoning":120,"benchmark_scicode_reasoning":983,"benchmark_ifbench_reasoning":4418,"benchmark_lcr_reasoning":623,"benchmark_terminalbench_reasoning":2936,"benchmark_tau2_reasoning":2896,"benchmark_intelligence":4102,"benchmark_coding":2768,"benchmark_intelligence_reasoning":1899,"benchmark_coding_reasoning":1701,"benchmark_math_reasoning":749},"30307f16-3a13-4f9c-af3e-67f54b6de3d3","96c17ad8-9224-4e8d-86a0-92f2f075f465","Gemini 2.5 Flash Lite Preview 09-2025 (Reasoning)","Gemini 2.5 Flash-Lite Preview (Sep '25) (Reasoning)",348.092,9.268,70.89999999999999,52.6,{"aa_id":4420,"ppt_model_id":4412,"slug":1893,"model_name":1894,"provider_name":248,"name":1894,"provider":248,"aa_name":4421,"is_open":11,"author_country":2653,"release_date":1896,"release_month":1785,"context_length":856,"inference_mode":2654,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":536,"input_price":495,"output_price":536,"tokens_per_second":4422,"time_to_first_token":4423,"benchmark_aime":12,"benchmark_aime_25":1454,"benchmark_gpqa":4123,"benchmark_hle":2776,"benchmark_ifbench":1662,"benchmark_lcr":4396,"benchmark_livecodebench":1897,"benchmark_math_hard":12,"benchmark_mmlu_pro":3785,"benchmark_scicode":3667,"benchmark_tau2":2860,"benchmark_terminalbench":3413,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1454,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1652,"benchmark_mmlu_pro_reasoning":1167,"benchmark_gpqa_reasoning":1898,"benchmark_aime_25_reasoning":749,"benchmark_hle_reasoning":120,"benchmark_scicode_reasoning":983,"benchmark_ifbench_reasoning":4418,"benchmark_lcr_reasoning":623,"benchmark_terminalbench_reasoning":2936,"benchmark_tau2_reasoning":2896,"benchmark_intelligence":4102,"benchmark_coding":2768,"benchmark_intelligence_reasoning":1899,"benchmark_coding_reasoning":1701,"benchmark_math_reasoning":749},"fd7595e8-aac2-49df-b70f-ce6cb39ec059","Gemini 2.5 Flash-Lite Preview (Sep '25) (Non-reasoning)",353.496,0.435,{"aa_id":4425,"ppt_model_id":4426,"slug":1915,"model_name":4427,"provider_name":3115,"name":1916,"provider":3115,"aa_name":4427,"is_open":37,"author_country":2817,"release_date":1918,"release_month":1785,"context_length":670,"inference_mode":3250,"input_price_per_1m_tokens":1626,"output_price_per_1m_tokens":1919,"input_price":1626,"output_price":1919,"tokens_per_second":4428,"time_to_first_token":4429,"benchmark_aime":12,"benchmark_aime_25":1500,"benchmark_gpqa":1921,"benchmark_hle":1209,"benchmark_ifbench":602,"benchmark_lcr":483,"benchmark_livecodebench":279,"benchmark_math_hard":12,"benchmark_mmlu_pro":889,"benchmark_scicode":3692,"benchmark_tau2":3546,"benchmark_terminalbench":3761,"benchmark_accountingaudit":12,"benchmark_agieval_zh":4430,"benchmark_agieval_en":4431,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4432,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":4433,"benchmark_knights_and_knaves":12,"benchmark_math":1700,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2667,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1793,"benchmark_livecodebench_reasoning":279,"benchmark_mmlu_pro_reasoning":889,"benchmark_gpqa_reasoning":1921,"benchmark_aime_25_reasoning":1500,"benchmark_hle_reasoning":1209,"benchmark_scicode_reasoning":3692,"benchmark_ifbench_reasoning":602,"benchmark_lcr_reasoning":483,"benchmark_terminalbench_reasoning":3761,"benchmark_tau2_reasoning":1143,"benchmark_intelligence":3961,"benchmark_coding":16,"benchmark_intelligence_reasoning":1923,"benchmark_coding_reasoning":1922,"benchmark_math_reasoning":1500},"75b3a070-7c0a-4038-9b8e-a939d6e493f5","8b2f0200-9b1d-4aae-b693-c74ff2d2b009","DeepSeek V3.2 Exp (Reasoning)",34.841,1.318,90.1053,89.0024,87.9742,88.1481,{"aa_id":4435,"ppt_model_id":4426,"slug":1915,"model_name":1916,"provider_name":3115,"name":1916,"provider":3115,"aa_name":4436,"is_open":37,"author_country":2817,"release_date":1918,"release_month":1785,"context_length":670,"inference_mode":2654,"input_price_per_1m_tokens":1626,"output_price_per_1m_tokens":1919,"input_price":1626,"output_price":1919,"tokens_per_second":4437,"time_to_first_token":4438,"benchmark_aime":12,"benchmark_aime_25":4232,"benchmark_gpqa":1608,"benchmark_hle":4439,"benchmark_ifbench":4440,"benchmark_lcr":1124,"benchmark_livecodebench":4110,"benchmark_math_hard":12,"benchmark_mmlu_pro":1375,"benchmark_scicode":3176,"benchmark_tau2":3546,"benchmark_terminalbench":174,"benchmark_accountingaudit":12,"benchmark_agieval_zh":4441,"benchmark_agieval_en":4442,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4443,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":4433,"benchmark_knights_and_knaves":12,"benchmark_math":1700,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2667,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_aider":1793,"benchmark_livecodebench_reasoning":279,"benchmark_mmlu_pro_reasoning":889,"benchmark_gpqa_reasoning":1921,"benchmark_aime_25_reasoning":1500,"benchmark_hle_reasoning":1209,"benchmark_scicode_reasoning":3692,"benchmark_ifbench_reasoning":602,"benchmark_lcr_reasoning":483,"benchmark_terminalbench_reasoning":3761,"benchmark_tau2_reasoning":1143,"benchmark_intelligence":3961,"benchmark_coding":16,"benchmark_intelligence_reasoning":1923,"benchmark_coding_reasoning":1922,"benchmark_math_reasoning":1500},"255db3f6-b52b-4518-a13e-e85ab74632b8","DeepSeek V3.2 Exp (Non-reasoning)",35.683,1.414,8.6,43.1,85.837,85.6638,52.8183,{"aa_id":4445,"ppt_model_id":4446,"slug":1926,"model_name":4447,"provider_name":138,"name":1927,"provider":138,"aa_name":4448,"is_open":11,"author_country":2653,"release_date":1929,"release_month":1785,"context_length":792,"inference_mode":3250,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":4449,"time_to_first_token":4450,"benchmark_aime":12,"benchmark_aime_25":1643,"benchmark_gpqa":4451,"benchmark_hle":2775,"benchmark_ifbench":1710,"benchmark_lcr":1108,"benchmark_livecodebench":2945,"benchmark_math_hard":12,"benchmark_mmlu_pro":1930,"benchmark_scicode":4452,"benchmark_tau2":3516,"benchmark_terminalbench":4453,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4454,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":4455,"benchmark_bbh":4456,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":4457,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":4397,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4458,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":569,"benchmark_mmlu_pro_reasoning":1930,"benchmark_gpqa_reasoning":1931,"benchmark_aime_25_reasoning":1643,"benchmark_hle_reasoning":330,"benchmark_scicode_reasoning":4452,"benchmark_ifbench_reasoning":1710,"benchmark_lcr_reasoning":1108,"benchmark_terminalbench_reasoning":4453,"benchmark_tau2_reasoning":1120,"benchmark_intelligence":2022,"benchmark_coding":3648,"benchmark_intelligence_reasoning":1124,"benchmark_coding_reasoning":1932,"benchmark_math_reasoning":1643},"4fc7fd80-7682-4bd2-992a-d309a21fa8a6","ef5ef4f0-abae-4919-af67-c859fce6b0df","Claude Sonnet 4.5 (Reasoning)","Claude 4.5 Sonnet (Reasoning)",46.097,8.526,83.39999999999999,44.7,35.6,85.978,37.1068,94.3941,97.561,72.8889,{"aa_id":4460,"ppt_model_id":4446,"slug":1926,"model_name":1927,"provider_name":138,"name":1927,"provider":138,"aa_name":4461,"is_open":11,"author_country":2653,"release_date":1929,"release_month":1785,"context_length":792,"inference_mode":2654,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":4462,"time_to_first_token":4463,"benchmark_aime":12,"benchmark_aime_25":4397,"benchmark_gpqa":1200,"benchmark_hle":3651,"benchmark_ifbench":4403,"benchmark_lcr":4031,"benchmark_livecodebench":623,"benchmark_math_hard":12,"benchmark_mmlu_pro":871,"benchmark_scicode":959,"benchmark_tau2":4464,"benchmark_terminalbench":3053,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4465,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4466,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3952,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":4397,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4467,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":569,"benchmark_mmlu_pro_reasoning":1930,"benchmark_gpqa_reasoning":1931,"benchmark_aime_25_reasoning":1643,"benchmark_hle_reasoning":330,"benchmark_scicode_reasoning":4452,"benchmark_ifbench_reasoning":1710,"benchmark_lcr_reasoning":1108,"benchmark_terminalbench_reasoning":4453,"benchmark_tau2_reasoning":1120,"benchmark_intelligence":2022,"benchmark_coding":3648,"benchmark_intelligence_reasoning":1124,"benchmark_coding_reasoning":1932,"benchmark_math_reasoning":1643},"eccd28a2-7b42-4952-94a5-aea9ea4cdcbd","Claude 4.5 Sonnet (Non-reasoning)",46.284,1.082,70.5,85.7423,94.302,71.6667,{"aa_id":4469,"ppt_model_id":4470,"slug":1935,"model_name":4471,"provider_name":4066,"name":1936,"provider":4066,"aa_name":4472,"is_open":37,"author_country":2653,"release_date":1938,"release_month":1785,"context_length":1939,"inference_mode":3250,"input_price_per_1m_tokens":324,"output_price_per_1m_tokens":1940,"input_price":324,"output_price":1940,"tokens_per_second":4473,"time_to_first_token":4474,"benchmark_aime":12,"benchmark_aime_25":871,"benchmark_gpqa":1943,"benchmark_hle":3679,"benchmark_ifbench":4475,"benchmark_lcr":4476,"benchmark_livecodebench":1417,"benchmark_math_hard":12,"benchmark_mmlu_pro":4283,"benchmark_scicode":3566,"benchmark_tau2":4464,"benchmark_terminalbench":174,"benchmark_accountingaudit":12,"benchmark_agieval_zh":4477,"benchmark_agieval_en":4478,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4479,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3775,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":1645,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1417,"benchmark_mmlu_pro_reasoning":1753,"benchmark_gpqa_reasoning":1943,"benchmark_aime_25_reasoning":871,"benchmark_hle_reasoning":3679,"benchmark_scicode_reasoning":3566,"benchmark_ifbench_reasoning":4475,"benchmark_lcr_reasoning":4480,"benchmark_terminalbench_reasoning":174,"benchmark_tau2_reasoning":4464,"benchmark_intelligence":2908,"benchmark_coding":2908,"benchmark_intelligence_reasoning":1944,"benchmark_coding_reasoning":556,"benchmark_math_reasoning":871},"c83b6f29-3107-4557-951d-007d950211f4","107762b9-fbdd-4109-a79b-3947204d1d99","GLM 4.6 (Reasoning)","GLM-4.6 (Reasoning)",62.118,0.763,43.4,54.300000000000004,88.1619,88.6364,85.5304,54.3,{"aa_id":4482,"ppt_model_id":4470,"slug":1935,"model_name":1936,"provider_name":4066,"name":1936,"provider":4066,"aa_name":4483,"is_open":37,"author_country":2653,"release_date":1938,"release_month":1785,"context_length":1939,"inference_mode":2654,"input_price_per_1m_tokens":324,"output_price_per_1m_tokens":1940,"input_price":324,"output_price":1940,"tokens_per_second":4484,"time_to_first_token":4485,"benchmark_aime":12,"benchmark_aime_25":3775,"benchmark_gpqa":1941,"benchmark_hle":2835,"benchmark_ifbench":1686,"benchmark_lcr":1610,"benchmark_livecodebench":4486,"benchmark_math_hard":12,"benchmark_mmlu_pro":1155,"benchmark_scicode":2733,"benchmark_tau2":1314,"benchmark_terminalbench":3053,"benchmark_accountingaudit":12,"benchmark_agieval_zh":4477,"benchmark_agieval_en":4478,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4479,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3775,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":1645,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1417,"benchmark_mmlu_pro_reasoning":1753,"benchmark_gpqa_reasoning":1943,"benchmark_aime_25_reasoning":871,"benchmark_hle_reasoning":3679,"benchmark_scicode_reasoning":3566,"benchmark_ifbench_reasoning":4475,"benchmark_lcr_reasoning":4480,"benchmark_terminalbench_reasoning":174,"benchmark_tau2_reasoning":4464,"benchmark_intelligence":2908,"benchmark_coding":2908,"benchmark_intelligence_reasoning":1944,"benchmark_coding_reasoning":556,"benchmark_math_reasoning":871},"50564bc8-c104-4cfa-b596-d206bfa43dbc","GLM-4.6 (Non-reasoning)",64.015,0.955,56.10000000000001,{"aa_id":4488,"ppt_model_id":4489,"slug":1955,"model_name":1956,"provider_name":1833,"name":1956,"provider":1833,"aa_name":1956,"is_open":37,"author_country":2817,"release_date":1958,"release_month":1951,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":808,"output_price_per_1m_tokens":819,"input_price":808,"output_price":819,"tokens_per_second":4490,"time_to_first_token":3603,"benchmark_aime":12,"benchmark_aime_25":656,"benchmark_gpqa":1417,"benchmark_hle":2722,"benchmark_ifbench":2733,"benchmark_lcr":1113,"benchmark_livecodebench":2791,"benchmark_math_hard":12,"benchmark_mmlu_pro":1876,"benchmark_scicode":3060,"benchmark_tau2":1243,"benchmark_terminalbench":2975,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":656,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4491,"benchmark_coding":691},"04883fc5-446a-4306-b809-75a933ccc0a6","dbdaca45-9dc0-4df6-81dd-c2b0c8776fd2",127.283,16.1,{"aa_id":4493,"ppt_model_id":4494,"slug":1979,"model_name":4495,"provider_name":2892,"name":1980,"provider":2892,"aa_name":4496,"is_open":11,"author_country":2653,"release_date":1982,"release_month":1951,"context_length":287,"inference_mode":3250,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":536,"input_price":495,"output_price":536,"tokens_per_second":4497,"time_to_first_token":4498,"benchmark_aime":871,"benchmark_aime_25":557,"benchmark_gpqa":767,"benchmark_hle":2753,"benchmark_ifbench":4397,"benchmark_lcr":1357,"benchmark_livecodebench":160,"benchmark_math_hard":1367,"benchmark_mmlu_pro":4499,"benchmark_scicode":3429,"benchmark_tau2":3366,"benchmark_terminalbench":1146,"benchmark_accountingaudit":3478,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":4500,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":615,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":160,"benchmark_mmlu_pro_reasoning":1985,"benchmark_gpqa_reasoning":767,"benchmark_math_hard_reasoning":1367,"benchmark_aime_reasoning":871,"benchmark_aime_25_reasoning":557,"benchmark_hle_reasoning":1014,"benchmark_scicode_reasoning":3429,"benchmark_ifbench_reasoning":4397,"benchmark_lcr_reasoning":1357,"benchmark_terminalbench_reasoning":1146,"benchmark_tau2_reasoning":3366,"benchmark_intelligence":1332,"benchmark_coding":2322,"benchmark_intelligence_reasoning":1987,"benchmark_coding_reasoning":1986,"benchmark_math_reasoning":557},"c233c167-ad99-4097-8530-acbf74f8d0b2","205a6ca0-39ce-4107-80f5-4ae2732ed82d","Llama 3.3 Nemotron Super 49B V1.5 (Reasoning)","Llama Nemotron Super 49B v1.5 (Reasoning)",63.803,0.327,81.39999999999999,25.3333,{"aa_id":4502,"ppt_model_id":4494,"slug":1979,"model_name":1980,"provider_name":2892,"name":1980,"provider":2892,"aa_name":4503,"is_open":11,"author_country":2653,"release_date":1982,"release_month":1951,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":536,"input_price":495,"output_price":536,"tokens_per_second":4504,"time_to_first_token":4505,"benchmark_aime":3338,"benchmark_aime_25":615,"benchmark_gpqa":1984,"benchmark_hle":2787,"benchmark_ifbench":1923,"benchmark_lcr":995,"benchmark_livecodebench":3299,"benchmark_math_hard":771,"benchmark_mmlu_pro":4506,"benchmark_scicode":4507,"benchmark_tau2":3412,"benchmark_terminalbench":2934,"benchmark_accountingaudit":3478,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":4500,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":615,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":160,"benchmark_mmlu_pro_reasoning":1985,"benchmark_gpqa_reasoning":767,"benchmark_math_hard_reasoning":1367,"benchmark_aime_reasoning":871,"benchmark_aime_25_reasoning":557,"benchmark_hle_reasoning":1014,"benchmark_scicode_reasoning":3429,"benchmark_ifbench_reasoning":4397,"benchmark_lcr_reasoning":1357,"benchmark_terminalbench_reasoning":1146,"benchmark_tau2_reasoning":3366,"benchmark_intelligence":1332,"benchmark_coding":2322,"benchmark_intelligence_reasoning":1987,"benchmark_coding_reasoning":1986,"benchmark_math_reasoning":557},"d852252c-2af6-49b8-aeef-dc675d74b579","Llama Nemotron Super 49B v1.5 (Non-reasoning)",64.828,0.317,69.19999999999999,23.799999999999997,{"aa_id":4509,"ppt_model_id":4510,"slug":2002,"model_name":2003,"provider_name":1833,"name":2003,"provider":1833,"aa_name":2003,"is_open":37,"author_country":2817,"release_date":2005,"release_month":1951,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":251,"output_price_per_1m_tokens":377,"input_price":251,"output_price":377,"tokens_per_second":4511,"time_to_first_token":4512,"benchmark_aime":12,"benchmark_aime_25":3777,"benchmark_gpqa":4403,"benchmark_hle":2731,"benchmark_ifbench":3906,"benchmark_lcr":3206,"benchmark_livecodebench":184,"benchmark_math_hard":12,"benchmark_mmlu_pro":4282,"benchmark_scicode":1191,"benchmark_tau2":119,"benchmark_terminalbench":363,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3777,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":691,"benchmark_coding":3148},"7b9e0f9a-8e35-47f9-85f9-cde966e60018","f331ac5a-07c5-480b-988d-277947d6b5d0",143.676,1.013,{"aa_id":4514,"ppt_model_id":4515,"slug":2017,"model_name":4516,"provider_name":138,"name":2018,"provider":138,"aa_name":4517,"is_open":11,"author_country":2653,"release_date":2020,"release_month":1951,"context_length":142,"inference_mode":3250,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":505,"input_price":61,"output_price":505,"tokens_per_second":4518,"time_to_first_token":4519,"benchmark_aime":12,"benchmark_aime_25":891,"benchmark_gpqa":1661,"benchmark_hle":3014,"benchmark_ifbench":4476,"benchmark_lcr":316,"benchmark_livecodebench":746,"benchmark_math_hard":12,"benchmark_mmlu_pro":1322,"benchmark_scicode":624,"benchmark_tau2":3254,"benchmark_terminalbench":3777,"benchmark_accountingaudit":3478,"benchmark_agieval_zh":12,"benchmark_agieval_en":4520,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4521,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3573,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1071,"benchmark_mbppplus":4522,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4523,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2924,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":746,"benchmark_mmlu_pro_reasoning":1322,"benchmark_gpqa_reasoning":1661,"benchmark_aime_25_reasoning":891,"benchmark_hle_reasoning":985,"benchmark_scicode_reasoning":624,"benchmark_ifbench_reasoning":4480,"benchmark_lcr_reasoning":316,"benchmark_terminalbench_reasoning":3777,"benchmark_tau2_reasoning":3254,"benchmark_intelligence":3761,"benchmark_coding":210,"benchmark_intelligence_reasoning":2022,"benchmark_coding_reasoning":1111,"benchmark_math_reasoning":891},"acc45090-203a-4286-b13a-6085792b0634","947b1bae-ffaa-4b35-9530-0f3dd4841fd6","Claude Haiku 4.5 (Reasoning)","Claude 4.5 Haiku (Reasoning)",107.805,12.109,76.9442,81.9843,53.4392,65.2222,{"aa_id":4525,"ppt_model_id":4515,"slug":2017,"model_name":2018,"provider_name":138,"name":2018,"provider":138,"aa_name":4526,"is_open":11,"author_country":2653,"release_date":2020,"release_month":1951,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":61,"output_price_per_1m_tokens":505,"input_price":61,"output_price":505,"tokens_per_second":4527,"time_to_first_token":4528,"benchmark_aime":12,"benchmark_aime_25":1071,"benchmark_gpqa":3760,"benchmark_hle":2787,"benchmark_ifbench":1645,"benchmark_lcr":1136,"benchmark_livecodebench":1012,"benchmark_math_hard":12,"benchmark_mmlu_pro":1398,"benchmark_scicode":2045,"benchmark_tau2":1944,"benchmark_terminalbench":3777,"benchmark_accountingaudit":3478,"benchmark_agieval_zh":12,"benchmark_agieval_en":4520,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4521,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":4529,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1071,"benchmark_mbppplus":4522,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4523,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2924,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":746,"benchmark_mmlu_pro_reasoning":1322,"benchmark_gpqa_reasoning":1661,"benchmark_aime_25_reasoning":891,"benchmark_hle_reasoning":985,"benchmark_scicode_reasoning":624,"benchmark_ifbench_reasoning":4480,"benchmark_lcr_reasoning":316,"benchmark_terminalbench_reasoning":3777,"benchmark_tau2_reasoning":3254,"benchmark_intelligence":3761,"benchmark_coding":210,"benchmark_intelligence_reasoning":2022,"benchmark_coding_reasoning":1111,"benchmark_math_reasoning":891},"43826d84-f0fe-415d-84d1-279fc0b532fc","Claude 4.5 Haiku (Non-reasoning)",98.68,0.504,93.9024,{"aa_id":4531,"ppt_model_id":4532,"slug":2041,"model_name":2042,"provider_name":4533,"name":2042,"provider":4533,"aa_name":4534,"is_open":37,"author_country":2653,"release_date":2044,"release_month":1951,"context_length":115,"inference_mode":2654,"input_price_per_1m_tokens":2038,"output_price_per_1m_tokens":288,"input_price":2038,"output_price":288,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":963,"benchmark_gpqa":2045,"benchmark_hle":960,"benchmark_ifbench":1610,"benchmark_lcr":2667,"benchmark_livecodebench":1713,"benchmark_math_hard":12,"benchmark_mmlu_pro":567,"benchmark_scicode":2753,"benchmark_tau2":2322,"benchmark_terminalbench":2667,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":963,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":570,"benchmark_coding":363},"43c816b4-fe68-4772-92ac-03c5308689a7","33935f10-8371-4635-a796-7f02b536c738","Liquid AI","LFM2 8B A1B",{"aa_id":4536,"ppt_model_id":4537,"slug":2048,"model_name":2049,"provider_name":1833,"name":2049,"provider":1833,"aa_name":2049,"is_open":11,"author_country":2817,"release_date":2051,"release_month":1951,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":2052,"output_price_per_1m_tokens":2053,"input_price":2052,"output_price":2053,"tokens_per_second":4538,"time_to_first_token":4539,"benchmark_aime":12,"benchmark_aime_25":2965,"benchmark_gpqa":3236,"benchmark_hle":1004,"benchmark_ifbench":2350,"benchmark_lcr":3239,"benchmark_livecodebench":2054,"benchmark_math_hard":12,"benchmark_mmlu_pro":3175,"benchmark_scicode":4540,"benchmark_tau2":119,"benchmark_terminalbench":427,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":577,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3160,"benchmark_coding":1068},"5bbae700-a12d-4cd3-8ac4-28a7f2b83181","7d9a95b9-e031-493d-bfdd-98e1852609d6",80.836,1.132,30.099999999999998,{"aa_id":4542,"ppt_model_id":4543,"slug":2057,"model_name":2058,"provider_name":3889,"name":2058,"provider":3889,"aa_name":4544,"is_open":37,"author_country":2817,"release_date":2060,"release_month":1951,"context_length":2061,"inference_mode":2654,"input_price_per_1m_tokens":2062,"output_price_per_1m_tokens":61,"input_price":2062,"output_price":61,"tokens_per_second":4545,"time_to_first_token":4546,"benchmark_aime":12,"benchmark_aime_25":4162,"benchmark_gpqa":1255,"benchmark_hle":2094,"benchmark_ifbench":656,"benchmark_lcr":1786,"benchmark_livecodebench":2063,"benchmark_math_hard":12,"benchmark_mmlu_pro":1192,"benchmark_scicode":265,"benchmark_tau2":2348,"benchmark_terminalbench":3419,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4547,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4548,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":4162,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":1071,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":265,"benchmark_coding":119},"b3e6b18d-11be-4c46-a1bd-23b6e2cbf67a","c2abef0e-6eee-4ef9-af65-1a8ea5a9b0fd","MiniMax-M2",51.188,1.408,85.1081,84.3649,{"aa_id":4550,"ppt_model_id":4551,"slug":2066,"model_name":4552,"provider_name":2892,"name":2067,"provider":2892,"aa_name":4553,"is_open":37,"author_country":2653,"release_date":2069,"release_month":1951,"context_length":287,"inference_mode":3250,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"tokens_per_second":4554,"time_to_first_token":4555,"benchmark_aime":12,"benchmark_aime_25":1351,"benchmark_gpqa":4556,"benchmark_hle":1146,"benchmark_ifbench":2694,"benchmark_lcr":1201,"benchmark_livecodebench":2693,"benchmark_math_hard":12,"benchmark_mmlu_pro":1551,"benchmark_scicode":2836,"benchmark_tau2":317,"benchmark_terminalbench":545,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":580,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":157,"benchmark_mmlu_pro_reasoning":1551,"benchmark_gpqa_reasoning":2072,"benchmark_aime_25_reasoning":1351,"benchmark_hle_reasoning":1146,"benchmark_scicode_reasoning":916,"benchmark_ifbench_reasoning":3865,"benchmark_lcr_reasoning":1201,"benchmark_terminalbench_reasoning":545,"benchmark_tau2_reasoning":317,"benchmark_intelligence":4557,"benchmark_coding":4243,"benchmark_intelligence_reasoning":2074,"benchmark_coding_reasoning":2073,"benchmark_math_reasoning":1351},"cb316445-6b3b-49a1-848b-55c48964db6c","e2ca0467-cf54-4fa6-92f0-5a2921d9cc28","Nemotron Nano 12B 2 VL (Reasoning)","NVIDIA Nemotron Nano 12B v2 VL (Reasoning)",131.087,0.232,57.199999999999996,10.1,{"aa_id":4559,"ppt_model_id":4551,"slug":2066,"model_name":2067,"provider_name":2892,"name":2067,"provider":2892,"aa_name":4560,"is_open":37,"author_country":2653,"release_date":2069,"release_month":1951,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"tokens_per_second":4561,"time_to_first_token":4562,"benchmark_aime":12,"benchmark_aime_25":2779,"benchmark_gpqa":2070,"benchmark_hle":545,"benchmark_ifbench":2788,"benchmark_lcr":2098,"benchmark_livecodebench":2071,"benchmark_math_hard":12,"benchmark_mmlu_pro":329,"benchmark_scicode":4563,"benchmark_tau2":3460,"benchmark_terminalbench":2667,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":580,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":157,"benchmark_mmlu_pro_reasoning":1551,"benchmark_gpqa_reasoning":2072,"benchmark_aime_25_reasoning":1351,"benchmark_hle_reasoning":1146,"benchmark_scicode_reasoning":916,"benchmark_ifbench_reasoning":3865,"benchmark_lcr_reasoning":1201,"benchmark_terminalbench_reasoning":545,"benchmark_tau2_reasoning":317,"benchmark_intelligence":4557,"benchmark_coding":4243,"benchmark_intelligence_reasoning":2074,"benchmark_coding_reasoning":2073,"benchmark_math_reasoning":1351},"a6a91e37-e0f0-45ec-93e2-4bf0ad6df7bd","NVIDIA Nemotron Nano 12B v2 VL (Non-reasoning)",139.59,0.558,17.599999999999998,{"aa_id":4565,"ppt_model_id":4566,"slug":2090,"model_name":2091,"provider_name":595,"name":2091,"provider":595,"aa_name":4567,"is_open":11,"author_country":2653,"release_date":2093,"release_month":1951,"context_length":792,"inference_mode":2654,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":2094,"input_price":220,"output_price":2094,"tokens_per_second":4568,"time_to_first_token":4569,"benchmark_aime":2098,"benchmark_aime_25":2775,"benchmark_gpqa":4570,"benchmark_hle":3012,"benchmark_ifbench":4316,"benchmark_lcr":16,"benchmark_livecodebench":2096,"benchmark_math_hard":4571,"benchmark_mmlu_pro":487,"benchmark_scicode":3739,"benchmark_tau2":388,"benchmark_terminalbench":2753,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":330,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1243,"benchmark_coding":1209},"35d3af20-7540-4534-8f39-6d087d43ba6b","09d517c4-dfef-434c-9408-e73521003c09","Nova Premier",64.064,0.889,56.89999999999999,83.89999999999999,{"aa_id":12,"ppt_model_id":4573,"slug":2101,"model_name":2102,"provider_name":1522,"name":2102,"provider":1522,"aa_name":12,"is_open":37,"author_country":2817,"release_date":2104,"release_month":2105,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":2106,"output_price_per_1m_tokens":78,"input_price":2106,"output_price":78,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4548,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12},"5548fade-b22b-46c7-ab24-423c1c3a49fd",{"aa_id":4575,"ppt_model_id":4576,"slug":2109,"model_name":2110,"provider_name":4577,"name":2110,"provider":4577,"aa_name":2110,"is_open":37,"author_country":2817,"release_date":2113,"release_month":2105,"context_length":981,"inference_mode":2654,"input_price_per_1m_tokens":2114,"output_price_per_1m_tokens":2115,"input_price":2114,"output_price":2115,"tokens_per_second":4578,"time_to_first_token":4579,"benchmark_aime":12,"benchmark_aime_25":3252,"benchmark_gpqa":1876,"benchmark_hle":859,"benchmark_ifbench":1598,"benchmark_lcr":4580,"benchmark_livecodebench":653,"benchmark_math_hard":12,"benchmark_mmlu_pro":1166,"benchmark_scicode":2906,"benchmark_tau2":4581,"benchmark_terminalbench":3983,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":893,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2337,"benchmark_coding":3388},"d522a0c3-6628-4f66-a66e-29fcf43f19a6","a7a1b7ad-c34a-462f-8d0f-a1fbdb1d3304","KwaiKAT",99.094,1.575,74,88.6,{"aa_id":4583,"ppt_model_id":4584,"slug":2118,"model_name":2119,"provider_name":9,"name":2119,"provider":9,"aa_name":4585,"is_open":11,"author_country":2653,"release_date":2121,"release_month":2105,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":78,"input_price":143,"output_price":78,"tokens_per_second":4586,"time_to_first_token":4587,"benchmark_aime":12,"benchmark_aime_25":2156,"benchmark_gpqa":1166,"benchmark_hle":2898,"benchmark_ifbench":654,"benchmark_lcr":4588,"benchmark_livecodebench":1375,"benchmark_math_hard":12,"benchmark_mmlu_pro":1192,"benchmark_scicode":276,"benchmark_tau2":4589,"benchmark_terminalbench":3213,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2156,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1932,"benchmark_coding":4590},"df8c1676-eb88-4271-8852-1db9e0000768","8bb9bbbf-65d6-4c3c-ba48-cde985c539f8","GPT-5.1 Codex mini (high)",191.375,4.033,62.7,62.9,36.4,{"aa_id":4592,"ppt_model_id":4593,"slug":2124,"model_name":2125,"provider_name":9,"name":2125,"provider":9,"aa_name":4594,"is_open":11,"author_country":2653,"release_date":2127,"release_month":2105,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":144,"output_price_per_1m_tokens":156,"input_price":144,"output_price":156,"tokens_per_second":4595,"time_to_first_token":4596,"benchmark_aime":12,"benchmark_aime_25":943,"benchmark_gpqa":871,"benchmark_hle":2744,"benchmark_ifbench":1188,"benchmark_lcr":4070,"benchmark_livecodebench":3804,"benchmark_math_hard":12,"benchmark_mmlu_pro":871,"benchmark_scicode":722,"benchmark_tau2":2393,"benchmark_terminalbench":3429,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":943,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4440,"benchmark_coding":2906},"ccdc2449-2707-4449-9fa6-0060adf02aeb","3bccdb83-1e8c-45b4-90d1-9fd02056ea15","GPT-5.1 Codex (high)",144.259,5.867,{"aa_id":4598,"ppt_model_id":4599,"slug":2136,"model_name":2137,"provider_name":9,"name":2137,"provider":9,"aa_name":4600,"is_open":11,"author_country":2653,"release_date":2139,"release_month":2105,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":107,"output_price_per_1m_tokens":505,"input_price":107,"output_price":505,"tokens_per_second":4601,"time_to_first_token":4602,"benchmark_aime":12,"benchmark_aime_25":1158,"benchmark_gpqa":905,"benchmark_hle":3411,"benchmark_ifbench":4292,"benchmark_lcr":1351,"benchmark_livecodebench":2348,"benchmark_math_hard":12,"benchmark_mmlu_pro":1379,"benchmark_scicode":624,"benchmark_tau2":3365,"benchmark_terminalbench":4603,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4604,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4605,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":4606,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3774,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4607,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4022,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1845,"benchmark_coding":3777},"dcb50b5e-795e-4da3-a994-2d297e571556","e3cef3fd-3245-4bb4-b038-65c6df636706","GPT-5.1 (high)",97.145,27.372,45.5,69.4423,69.7896,94.5122,60.6667,{"aa_id":4609,"ppt_model_id":4599,"slug":2136,"model_name":2137,"provider_name":9,"name":2137,"provider":9,"aa_name":4610,"is_open":11,"author_country":2653,"release_date":2139,"release_month":2105,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":107,"output_price_per_1m_tokens":505,"input_price":107,"output_price":505,"tokens_per_second":4611,"time_to_first_token":4612,"benchmark_aime":12,"benchmark_aime_25":3774,"benchmark_gpqa":1233,"benchmark_hle":2835,"benchmark_ifbench":4613,"benchmark_lcr":1324,"benchmark_livecodebench":2140,"benchmark_math_hard":12,"benchmark_mmlu_pro":3859,"benchmark_scicode":1644,"benchmark_tau2":484,"benchmark_terminalbench":4094,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4604,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4605,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":4606,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3774,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4607,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4022,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1845,"benchmark_coding":3777},"9d12d1e1-fd48-48db-ad60-d0f1f28b3897","GPT-5.1 (Non-reasoning)",90.941,0.665,43.2,{"aa_id":4615,"ppt_model_id":4616,"slug":2150,"model_name":2151,"provider_name":248,"name":2151,"provider":248,"aa_name":4617,"is_open":11,"author_country":2653,"release_date":2153,"release_month":2105,"context_length":856,"inference_mode":2654,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":558,"input_price":78,"output_price":558,"tokens_per_second":4618,"time_to_first_token":4619,"benchmark_aime":12,"benchmark_aime_25":943,"benchmark_gpqa":2155,"benchmark_hle":4620,"benchmark_ifbench":4621,"benchmark_lcr":1024,"benchmark_livecodebench":2156,"benchmark_math_hard":12,"benchmark_mmlu_pro":2154,"benchmark_scicode":4486,"benchmark_tau2":1221,"benchmark_terminalbench":2933,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4622,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4623,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3952,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":943,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":673,"benchmark_coding":484},"cb7d1c71-104e-42bd-8df5-426b84289b5a","6000a5ec-8f26-4423-9246-70e7e0170662","Gemini 3 Pro Preview (high)",114.876,25.531,37.2,70.39999999999999,93.205,93.7798,{"aa_id":4625,"ppt_model_id":4626,"slug":2159,"model_name":4627,"provider_name":3823,"name":2160,"provider":3823,"aa_name":4627,"is_open":11,"author_country":2653,"release_date":2162,"release_month":2105,"context_length":1842,"inference_mode":3250,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":25,"input_price":377,"output_price":25,"tokens_per_second":4628,"time_to_first_token":4629,"benchmark_aime":12,"benchmark_aime_25":973,"benchmark_gpqa":994,"benchmark_hle":4563,"benchmark_ifbench":133,"benchmark_lcr":3117,"benchmark_livecodebench":3712,"benchmark_math_hard":12,"benchmark_mmlu_pro":4190,"benchmark_scicode":2497,"benchmark_tau2":3697,"benchmark_terminalbench":4267,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4630,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4631,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1184,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4632,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1313,"benchmark_mmlu_pro_reasoning":2165,"benchmark_gpqa_reasoning":994,"benchmark_aime_25_reasoning":973,"benchmark_hle_reasoning":1556,"benchmark_scicode_reasoning":2497,"benchmark_ifbench_reasoning":133,"benchmark_lcr_reasoning":3117,"benchmark_terminalbench_reasoning":4267,"benchmark_tau2_reasoning":1271,"benchmark_intelligence":4633,"benchmark_coding":4634,"benchmark_intelligence_reasoning":1932,"benchmark_coding_reasoning":2166,"benchmark_math_reasoning":973},"41d8a4fc-4a40-4b8f-ba10-a88fb54e12b6","388fe3db-9e27-44d1-a3d6-855a3942a063","Grok 4.1 Fast (Reasoning)",128.891,8.47,67.3998,72.078,0.6667,23.6,19.5,{"aa_id":4636,"ppt_model_id":4626,"slug":2159,"model_name":2160,"provider_name":3823,"name":2160,"provider":3823,"aa_name":4637,"is_open":11,"author_country":2653,"release_date":2162,"release_month":2105,"context_length":1842,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":25,"input_price":377,"output_price":25,"tokens_per_second":4638,"time_to_first_token":50,"benchmark_aime":12,"benchmark_aime_25":3596,"benchmark_gpqa":2163,"benchmark_hle":505,"benchmark_ifbench":1644,"benchmark_lcr":995,"benchmark_livecodebench":3176,"benchmark_math_hard":12,"benchmark_mmlu_pro":1237,"benchmark_scicode":2718,"benchmark_tau2":2163,"benchmark_terminalbench":4639,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4640,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4641,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1184,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4632,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1313,"benchmark_mmlu_pro_reasoning":2165,"benchmark_gpqa_reasoning":994,"benchmark_aime_25_reasoning":973,"benchmark_hle_reasoning":1556,"benchmark_scicode_reasoning":2497,"benchmark_ifbench_reasoning":133,"benchmark_lcr_reasoning":3117,"benchmark_terminalbench_reasoning":4267,"benchmark_tau2_reasoning":1271,"benchmark_intelligence":4633,"benchmark_coding":4634,"benchmark_intelligence_reasoning":1932,"benchmark_coding_reasoning":2166,"benchmark_math_reasoning":973},"1882b720-e14e-4ae6-8c58-577c21556ca2","Grok 4.1 Fast (Non-reasoning)",115.232,14.399999999999999,66.9678,71.5558,{"aa_id":4643,"ppt_model_id":4644,"slug":2175,"model_name":2176,"provider_name":3400,"name":2176,"provider":3400,"aa_name":2176,"is_open":37,"author_country":2653,"release_date":2178,"release_month":2105,"context_length":181,"inference_mode":2654,"input_price_per_1m_tokens":411,"output_price_per_1m_tokens":377,"input_price":411,"output_price":377,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":1024,"benchmark_gpqa":449,"benchmark_hle":230,"benchmark_ifbench":3665,"benchmark_lcr":2667,"benchmark_livecodebench":712,"benchmark_math_hard":12,"benchmark_mmlu_pro":1342,"benchmark_scicode":1023,"benchmark_tau2":2667,"benchmark_terminalbench":524,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1024,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3015,"benchmark_coding":3413},"18c8bd85-690a-4713-841e-325ebcd3c27b","1474e551-56de-4880-bd62-b04c2a22fc8d",{"aa_id":4646,"ppt_model_id":4647,"slug":2181,"model_name":2182,"provider_name":3400,"name":2182,"provider":3400,"aa_name":2182,"is_open":37,"author_country":2653,"release_date":2184,"release_month":2105,"context_length":181,"inference_mode":2654,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":377,"input_price":495,"output_price":377,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":3926,"benchmark_gpqa":1201,"benchmark_hle":4648,"benchmark_ifbench":3402,"benchmark_lcr":2667,"benchmark_livecodebench":723,"benchmark_math_hard":12,"benchmark_mmlu_pro":1270,"benchmark_scicode":2944,"benchmark_tau2":1144,"benchmark_terminalbench":2667,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3926,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4649,"benchmark_coding":1536},"b4d91d25-533f-4ab6-98eb-12db6b4f65e4","866f6cf4-cb04-46d9-a910-3c7e867f82a6",5.800000000000001,8.2,{"aa_id":4651,"ppt_model_id":4652,"slug":2187,"model_name":2188,"provider_name":3400,"name":2188,"provider":3400,"aa_name":2188,"is_open":37,"author_country":2653,"release_date":2190,"release_month":2105,"context_length":181,"inference_mode":2654,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":25,"input_price":273,"output_price":25,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":160,"benchmark_gpqa":1786,"benchmark_hle":3691,"benchmark_ifbench":413,"benchmark_lcr":2667,"benchmark_livecodebench":1661,"benchmark_math_hard":12,"benchmark_mmlu_pro":1551,"benchmark_scicode":2789,"benchmark_tau2":2667,"benchmark_terminalbench":26,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":160,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3245,"benchmark_coding":2322},"f11b617c-6da1-45d4-86a8-6d3485a5a288","33efe38f-e981-42b3-ad8c-1fe42c09b8e3",{"aa_id":4654,"ppt_model_id":4655,"slug":2193,"model_name":4656,"provider_name":138,"name":2194,"provider":138,"aa_name":4656,"is_open":11,"author_country":2653,"release_date":2196,"release_month":2105,"context_length":142,"inference_mode":3250,"input_price_per_1m_tokens":505,"output_price_per_1m_tokens":174,"input_price":505,"output_price":174,"tokens_per_second":4657,"time_to_first_token":4658,"benchmark_aime":12,"benchmark_aime_25":1135,"benchmark_gpqa":1499,"benchmark_hle":3961,"benchmark_ifbench":3640,"benchmark_lcr":4580,"benchmark_livecodebench":1221,"benchmark_math_hard":12,"benchmark_mmlu_pro":2197,"benchmark_scicode":1415,"benchmark_tau2":2197,"benchmark_terminalbench":1219,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3952,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":4588,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4659,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4660,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1221,"benchmark_mmlu_pro_reasoning":2197,"benchmark_gpqa_reasoning":1499,"benchmark_aime_25_reasoning":1135,"benchmark_hle_reasoning":3961,"benchmark_scicode_reasoning":1415,"benchmark_ifbench_reasoning":3633,"benchmark_lcr_reasoning":4580,"benchmark_terminalbench_reasoning":1219,"benchmark_tau2_reasoning":2197,"benchmark_intelligence":4440,"benchmark_coding":4194,"benchmark_intelligence_reasoning":2199,"benchmark_coding_reasoning":2198,"benchmark_math_reasoning":1135},"7a42bd68-1fe9-4866-bf08-441cb05ea703","251c56dd-1f10-43a9-a79b-eeaae13f4e65","Claude Opus 4.5 (Reasoning)",51.401,10.218,76.3333,49.3333,{"aa_id":4662,"ppt_model_id":4655,"slug":2193,"model_name":2194,"provider_name":138,"name":2194,"provider":138,"aa_name":4663,"is_open":11,"author_country":2653,"release_date":2196,"release_month":2105,"context_length":142,"inference_mode":2654,"input_price_per_1m_tokens":505,"output_price_per_1m_tokens":174,"input_price":505,"output_price":174,"tokens_per_second":4664,"time_to_first_token":4665,"benchmark_aime":12,"benchmark_aime_25":4588,"benchmark_gpqa":690,"benchmark_hle":2936,"benchmark_ifbench":1124,"benchmark_lcr":1764,"benchmark_livecodebench":1608,"benchmark_math_hard":12,"benchmark_mmlu_pro":1070,"benchmark_scicode":1219,"benchmark_tau2":1253,"benchmark_terminalbench":326,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3952,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":4588,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4659,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4660,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1221,"benchmark_mmlu_pro_reasoning":2197,"benchmark_gpqa_reasoning":1499,"benchmark_aime_25_reasoning":1135,"benchmark_hle_reasoning":3961,"benchmark_scicode_reasoning":1415,"benchmark_ifbench_reasoning":3633,"benchmark_lcr_reasoning":4580,"benchmark_terminalbench_reasoning":1219,"benchmark_tau2_reasoning":2197,"benchmark_intelligence":4440,"benchmark_coding":4194,"benchmark_intelligence_reasoning":2199,"benchmark_coding_reasoning":2198,"benchmark_math_reasoning":1135},"b42b4cea-b810-4501-9bcb-d6f6a03f025a","Claude Opus 4.5 (Non-reasoning)",50.559,1.262,{"aa_id":4667,"ppt_model_id":4668,"slug":2202,"model_name":2203,"provider_name":4669,"name":2203,"provider":4669,"aa_name":2203,"is_open":37,"author_country":2653,"release_date":2206,"release_month":2105,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":700,"input_price":377,"output_price":700,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":1643,"benchmark_gpqa":2207,"benchmark_hle":3245,"benchmark_ifbench":1357,"benchmark_lcr":3906,"benchmark_livecodebench":1255,"benchmark_math_hard":12,"benchmark_mmlu_pro":3712,"benchmark_scicode":3928,"benchmark_tau2":723,"benchmark_terminalbench":3983,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4670,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":4671,"benchmark_bird_critic":4672,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":4673,"benchmark_humaneval":3183,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1643,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1420,"benchmark_coding":4674},"6e8d326e-6511-428a-b4ad-b54b58f3cff3","8ef11470-a584-448d-9a91-18a3cb3cc419","Prime Intellect",86.4493,63.4542,24.6667,94.7688,19.1,{"aa_id":4676,"ppt_model_id":4677,"slug":2210,"model_name":4678,"provider_name":3115,"name":2211,"provider":3115,"aa_name":4678,"is_open":37,"author_country":2817,"release_date":2213,"release_month":2214,"context_length":670,"inference_mode":3250,"input_price_per_1m_tokens":793,"output_price_per_1m_tokens":2215,"input_price":793,"output_price":2215,"tokens_per_second":4679,"time_to_first_token":4680,"benchmark_aime":12,"benchmark_aime_25":2216,"benchmark_gpqa":1190,"benchmark_hle":1420,"benchmark_ifbench":3251,"benchmark_lcr":4368,"benchmark_livecodebench":1406,"benchmark_math_hard":12,"benchmark_mmlu_pro":1406,"benchmark_scicode":4136,"benchmark_tau2":4681,"benchmark_terminalbench":4453,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4682,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":4529,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":623,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1406,"benchmark_mmlu_pro_reasoning":1406,"benchmark_gpqa_reasoning":1190,"benchmark_aime_25_reasoning":2216,"benchmark_hle_reasoning":1420,"benchmark_scicode_reasoning":4136,"benchmark_ifbench_reasoning":3275,"benchmark_lcr_reasoning":4368,"benchmark_terminalbench_reasoning":4453,"benchmark_tau2_reasoning":3532,"benchmark_intelligence":3847,"benchmark_coding":2263,"benchmark_intelligence_reasoning":554,"benchmark_coding_reasoning":1686,"benchmark_math_reasoning":2216},"91fb2fa1-db9a-4f48-aa58-4f6a88b2b2f7","3342239a-0ccc-4e5d-891e-84d667cb75d2","DeepSeek V3.2 (Reasoning)",35.65,1.432,90.60000000000001,88.4964,{"aa_id":4684,"ppt_model_id":4677,"slug":2210,"model_name":2211,"provider_name":3115,"name":2211,"provider":3115,"aa_name":4685,"is_open":37,"author_country":2817,"release_date":2213,"release_month":2214,"context_length":670,"inference_mode":2654,"input_price_per_1m_tokens":793,"output_price_per_1m_tokens":2215,"input_price":793,"output_price":2215,"tokens_per_second":4686,"time_to_first_token":4687,"benchmark_aime":12,"benchmark_aime_25":623,"benchmark_gpqa":1709,"benchmark_hle":2322,"benchmark_ifbench":3676,"benchmark_lcr":1071,"benchmark_livecodebench":1553,"benchmark_math_hard":12,"benchmark_mmlu_pro":891,"benchmark_scicode":118,"benchmark_tau2":279,"benchmark_terminalbench":1111,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":623,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":1406,"benchmark_mmlu_pro_reasoning":1406,"benchmark_gpqa_reasoning":1190,"benchmark_aime_25_reasoning":2216,"benchmark_hle_reasoning":1420,"benchmark_scicode_reasoning":4136,"benchmark_ifbench_reasoning":3275,"benchmark_lcr_reasoning":4368,"benchmark_terminalbench_reasoning":4453,"benchmark_tau2_reasoning":3532,"benchmark_intelligence":3847,"benchmark_coding":2263,"benchmark_intelligence_reasoning":554,"benchmark_coding_reasoning":1686,"benchmark_math_reasoning":2216},"145f1eff-6844-4d2e-b905-42f334073187","DeepSeek V3.2 (Non-reasoning)",34.852,1.415,{"aa_id":4689,"ppt_model_id":4690,"slug":2219,"model_name":2220,"provider_name":3115,"name":2220,"provider":3115,"aa_name":2220,"is_open":37,"author_country":2817,"release_date":2222,"release_month":2214,"context_length":670,"inference_mode":2654,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":182,"input_price":536,"output_price":182,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":1408,"benchmark_gpqa":1221,"benchmark_hle":568,"benchmark_ifbench":158,"benchmark_lcr":1553,"benchmark_livecodebench":4691,"benchmark_math_hard":12,"benchmark_mmlu_pro":1253,"benchmark_scicode":1324,"benchmark_tau2":2667,"benchmark_terminalbench":3429,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1408,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3013,"benchmark_coding":198},"f8dce6a3-9d23-4fe4-8ab9-acefc77277b7","f722eb72-0454-49fc-85d1-7bdfacc37c6d",89.60000000000001,{"aa_id":12,"ppt_model_id":4693,"slug":2233,"model_name":2234,"provider_name":83,"name":2234,"provider":83,"aa_name":12,"is_open":37,"author_country":2666,"release_date":2236,"release_month":2214,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":25,"output_price_per_1m_tokens":26,"input_price":25,"output_price":26,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4694,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":4695,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":174,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3588,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2765,"benchmark_wmdp":12,"benchmark_wmt":12},"ac4606ba-e553-4989-b763-ee5e701db2ec",73.9984,18.7389,{"aa_id":4697,"ppt_model_id":4698,"slug":2245,"model_name":2246,"provider_name":2665,"name":2246,"provider":2665,"aa_name":4699,"is_open":37,"author_country":2666,"release_date":2248,"release_month":2214,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":273,"input_price":273,"output_price":273,"tokens_per_second":4700,"time_to_first_token":4701,"benchmark_aime":12,"benchmark_aime_25":2096,"benchmark_gpqa":3052,"benchmark_hle":2787,"benchmark_ifbench":2692,"benchmark_lcr":3506,"benchmark_livecodebench":1203,"benchmark_math_hard":12,"benchmark_mmlu_pro":2249,"benchmark_scicode":2676,"benchmark_tau2":723,"benchmark_terminalbench":545,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":2096,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":185,"benchmark_coding":156},"ec849f68-fba8-46f6-bcfc-b494f4b57072","a2152d25-d551-4a3f-9290-9af73c2e1cdc","Ministral 3 8B",151.831,0.311,{"aa_id":4703,"ppt_model_id":4704,"slug":2252,"model_name":2253,"provider_name":2665,"name":2253,"provider":2665,"aa_name":4705,"is_open":11,"author_country":2666,"release_date":2255,"release_month":2214,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"tokens_per_second":4706,"time_to_first_token":4707,"benchmark_aime":12,"benchmark_aime_25":16,"benchmark_gpqa":4556,"benchmark_hle":2776,"benchmark_ifbench":3507,"benchmark_lcr":995,"benchmark_livecodebench":2674,"benchmark_math_hard":12,"benchmark_mmlu_pro":1528,"benchmark_scicode":3168,"benchmark_tau2":3597,"benchmark_terminalbench":545,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":16,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":417,"benchmark_coding":1712},"16383a5b-5102-4071-aaa6-e16a05425d5a","6033ce64-0d25-4d19-9294-aaae47440ad6","Ministral 3 14B",131.457,0.339,{"aa_id":4709,"ppt_model_id":4710,"slug":2258,"model_name":2259,"provider_name":595,"name":2259,"provider":595,"aa_name":4711,"is_open":11,"author_country":2653,"release_date":2261,"release_month":2214,"context_length":792,"inference_mode":2654,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":220,"input_price":50,"output_price":220,"tokens_per_second":4712,"time_to_first_token":4713,"benchmark_aime":12,"benchmark_aime_25":917,"benchmark_gpqa":2262,"benchmark_hle":68,"benchmark_ifbench":209,"benchmark_lcr":3037,"benchmark_livecodebench":3960,"benchmark_math_hard":12,"benchmark_mmlu_pro":1237,"benchmark_scicode":3506,"benchmark_tau2":4714,"benchmark_terminalbench":2753,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":917,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3090,"benchmark_coding":2094},"2f0a8227-1f85-4bad-8e25-2d704c755bf3","ca290f3e-5253-4047-a140-ab3f11733870","Nova 2.0 Lite (Non-reasoning)",196.699,0.547,62,{"aa_id":4716,"ppt_model_id":4717,"slug":2287,"model_name":4718,"provider_name":4066,"name":2288,"provider":4066,"aa_name":4719,"is_open":37,"author_country":2653,"release_date":2290,"release_month":2214,"context_length":287,"inference_mode":3250,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":312,"input_price":50,"output_price":312,"tokens_per_second":4720,"time_to_first_token":3205,"benchmark_aime":12,"benchmark_aime_25":994,"benchmark_gpqa":4721,"benchmark_hle":1110,"benchmark_ifbench":4540,"benchmark_lcr":3253,"benchmark_livecodebench":417,"benchmark_math_hard":12,"benchmark_mmlu_pro":2293,"benchmark_scicode":2860,"benchmark_tau2":2964,"benchmark_terminalbench":4639,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":4500,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1610,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":1254,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":417,"benchmark_mmlu_pro_reasoning":2293,"benchmark_gpqa_reasoning":2294,"benchmark_aime_25_reasoning":994,"benchmark_hle_reasoning":1110,"benchmark_scicode_reasoning":2860,"benchmark_ifbench_reasoning":2437,"benchmark_lcr_reasoning":1628,"benchmark_terminalbench_reasoning":1765,"benchmark_tau2_reasoning":2964,"benchmark_intelligence":3819,"benchmark_coding":1636,"benchmark_intelligence_reasoning":278,"benchmark_coding_reasoning":2295,"benchmark_math_reasoning":994},"72d1b25a-cb3f-453c-8806-5f7523536f2f","66d13cca-1879-4ef3-9b4d-1315e806aa05","GLM 4.6V (Reasoning)","GLM-4.6V (Reasoning)",25.089,71.89999999999999,{"aa_id":4723,"ppt_model_id":4717,"slug":2287,"model_name":2288,"provider_name":4066,"name":2288,"provider":4066,"aa_name":4724,"is_open":37,"author_country":2653,"release_date":2290,"release_month":2214,"context_length":287,"inference_mode":2654,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":312,"input_price":50,"output_price":312,"tokens_per_second":4725,"time_to_first_token":4726,"benchmark_aime":12,"benchmark_aime_25":1610,"benchmark_gpqa":4727,"benchmark_hle":3403,"benchmark_ifbench":3739,"benchmark_lcr":2685,"benchmark_livecodebench":4207,"benchmark_math_hard":12,"benchmark_mmlu_pro":1040,"benchmark_scicode":3597,"benchmark_tau2":2896,"benchmark_terminalbench":68,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":4500,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1610,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":1254,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":417,"benchmark_mmlu_pro_reasoning":2293,"benchmark_gpqa_reasoning":2294,"benchmark_aime_25_reasoning":994,"benchmark_hle_reasoning":1110,"benchmark_scicode_reasoning":2860,"benchmark_ifbench_reasoning":2437,"benchmark_lcr_reasoning":1628,"benchmark_terminalbench_reasoning":1765,"benchmark_tau2_reasoning":2964,"benchmark_intelligence":3819,"benchmark_coding":1636,"benchmark_intelligence_reasoning":278,"benchmark_coding_reasoning":2295,"benchmark_math_reasoning":994},"fd3afb4b-7ee5-4cd6-a056-31576b95333a","GLM-4.6V (Non-reasoning)",21.614,1.35,56.599999999999994,{"aa_id":4729,"ppt_model_id":4730,"slug":2304,"model_name":2305,"provider_name":2665,"name":2305,"provider":2665,"aa_name":4731,"is_open":37,"author_country":2666,"release_date":2307,"release_month":2214,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":312,"input_price":536,"output_price":312,"tokens_per_second":4732,"time_to_first_token":536,"benchmark_aime":12,"benchmark_aime_25":1686,"benchmark_gpqa":636,"benchmark_hle":2943,"benchmark_ifbench":514,"benchmark_lcr":16,"benchmark_livecodebench":4733,"benchmark_math_hard":12,"benchmark_mmlu_pro":781,"benchmark_scicode":2733,"benchmark_tau2":3659,"benchmark_terminalbench":2711,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1686,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":995,"benchmark_coding":1113},"e8096426-41d2-49a4-b826-b903ef8032b7","7616fd8a-5936-490e-a4a2-3d8b0df97880","Devstral 2",74.137,44.800000000000004,{"aa_id":4735,"ppt_model_id":4736,"slug":2311,"model_name":2312,"provider_name":9,"name":2312,"provider":9,"aa_name":4737,"is_open":11,"author_country":2653,"release_date":2314,"release_month":2214,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":2315,"output_price_per_1m_tokens":439,"input_price":2315,"output_price":439,"tokens_per_second":4738,"time_to_first_token":4739,"benchmark_aime":12,"benchmark_aime_25":974,"benchmark_gpqa":982,"benchmark_hle":3148,"benchmark_ifbench":146,"benchmark_lcr":3774,"benchmark_livecodebench":958,"benchmark_math_hard":12,"benchmark_mmlu_pro":4499,"benchmark_scicode":3517,"benchmark_tau2":484,"benchmark_terminalbench":2349,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4740,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4741,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":974,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4742,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4743,"benchmark_coding":425},"0e02d475-2d84-4167-b137-4c4b2bc412d1","339acfd7-f6a6-4d63-89b3-819191841d95","GPT-5.2 (Non-reasoning)",67.905,0.619,71.7203,67.5933,62.3333,33.6,{"aa_id":4745,"ppt_model_id":4746,"slug":2318,"model_name":2319,"provider_name":9,"name":2319,"provider":9,"aa_name":4747,"is_open":11,"author_country":2653,"release_date":2321,"release_month":2214,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":2322,"output_price_per_1m_tokens":1190,"input_price":2322,"output_price":1190,"tokens_per_second":4748,"time_to_first_token":4749,"benchmark_aime":12,"benchmark_aime_25":1501,"benchmark_gpqa":1169,"benchmark_hle":3430,"benchmark_ifbench":4176,"benchmark_lcr":1200,"benchmark_livecodebench":1070,"benchmark_math_hard":12,"benchmark_mmlu_pro":2323,"benchmark_scicode":2730,"benchmark_tau2":1112,"benchmark_terminalbench":1219,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1501,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4035,"benchmark_coding":737},"69d843fd-aaaf-4d15-8849-26ec93c858b3","f5e8b5ab-bf13-41d8-988f-649bf830a38b","GPT-5.2 (xhigh)",70.499,101.222,{"aa_id":4751,"ppt_model_id":4752,"slug":2333,"model_name":4753,"provider_name":2892,"name":2334,"provider":2892,"aa_name":4754,"is_open":37,"author_country":2653,"release_date":2336,"release_month":2214,"context_length":1477,"inference_mode":3250,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":377,"input_price":299,"output_price":377,"tokens_per_second":4755,"time_to_first_token":4756,"benchmark_aime":12,"benchmark_aime_25":918,"benchmark_gpqa":1356,"benchmark_hle":4095,"benchmark_ifbench":4757,"benchmark_lcr":917,"benchmark_livecodebench":2339,"benchmark_math_hard":12,"benchmark_mmlu_pro":2338,"benchmark_scicode":2718,"benchmark_tau2":326,"benchmark_terminalbench":3527,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":4758,"benchmark_bird_critic":4759,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":4760,"benchmark_humaneval":3533,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3679,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":2339,"benchmark_mmlu_pro_reasoning":2338,"benchmark_gpqa_reasoning":1356,"benchmark_aime_25_reasoning":918,"benchmark_hle_reasoning":4095,"benchmark_scicode_reasoning":210,"benchmark_ifbench_reasoning":4757,"benchmark_lcr_reasoning":917,"benchmark_terminalbench_reasoning":3229,"benchmark_tau2_reasoning":326,"benchmark_intelligence":1242,"benchmark_coding":4761,"benchmark_intelligence_reasoning":1236,"benchmark_coding_reasoning":1243,"benchmark_math_reasoning":918},"816af11c-6e2c-461f-9f58-73556b20df0b","f74cc70d-f621-4c13-a1d9-ed49a6616c19","Nemotron 3 Nano 30B A3B (Reasoning)","NVIDIA Nemotron 3 Nano 30B A3B (Reasoning)",146.421,1.054,71.1,41.6122,22.6667,95.3753,15.8,{"aa_id":4763,"ppt_model_id":4752,"slug":2333,"model_name":2334,"provider_name":2892,"name":2334,"provider":2892,"aa_name":4764,"is_open":37,"author_country":2653,"release_date":2336,"release_month":2214,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":299,"output_price_per_1m_tokens":377,"input_price":299,"output_price":377,"tokens_per_second":4765,"time_to_first_token":4766,"benchmark_aime":12,"benchmark_aime_25":3679,"benchmark_gpqa":3176,"benchmark_hle":2776,"benchmark_ifbench":4767,"benchmark_lcr":429,"benchmark_livecodebench":2337,"benchmark_math_hard":12,"benchmark_mmlu_pro":29,"benchmark_scicode":4768,"benchmark_tau2":1511,"benchmark_terminalbench":3245,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":4758,"benchmark_bird_critic":4759,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":4760,"benchmark_humaneval":3533,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":3679,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":2339,"benchmark_mmlu_pro_reasoning":2338,"benchmark_gpqa_reasoning":1356,"benchmark_aime_25_reasoning":918,"benchmark_hle_reasoning":4095,"benchmark_scicode_reasoning":210,"benchmark_ifbench_reasoning":4757,"benchmark_lcr_reasoning":917,"benchmark_terminalbench_reasoning":3229,"benchmark_tau2_reasoning":326,"benchmark_intelligence":1242,"benchmark_coding":4761,"benchmark_intelligence_reasoning":1236,"benchmark_coding_reasoning":1243,"benchmark_math_reasoning":918},"5ac40c88-9acf-4adb-bd21-f68462cbc474","NVIDIA Nemotron 3 Nano 30B A3B (Non-reasoning)",84.548,0.276,37.5,23,{"aa_id":4770,"ppt_model_id":4771,"slug":2342,"model_name":2343,"provider_name":2344,"name":2343,"provider":2344,"aa_name":4772,"is_open":37,"author_country":2817,"release_date":2346,"release_month":2214,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":404,"output_price_per_1m_tokens":744,"input_price":404,"output_price":744,"tokens_per_second":4773,"time_to_first_token":4774,"benchmark_aime":12,"benchmark_aime_25":18,"benchmark_gpqa":785,"benchmark_hle":436,"benchmark_ifbench":4775,"benchmark_lcr":1233,"benchmark_livecodebench":722,"benchmark_math_hard":12,"benchmark_mmlu_pro":221,"benchmark_scicode":388,"benchmark_tau2":3697,"benchmark_terminalbench":3761,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":18,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":2348,"benchmark_mmlu_pro_reasoning":1268,"benchmark_gpqa_reasoning":2347,"benchmark_aime_25_reasoning":2351,"benchmark_hle_reasoning":4776,"benchmark_scicode_reasoning":148,"benchmark_ifbench_reasoning":2249,"benchmark_lcr_reasoning":3158,"benchmark_terminalbench_reasoning":1220,"benchmark_tau2_reasoning":2385,"benchmark_intelligence":2860,"benchmark_coding":3419,"benchmark_intelligence_reasoning":2350,"benchmark_coding_reasoning":2349,"benchmark_math_reasoning":2351},"6f121be6-f491-4e39-896e-419b16366931","32b0be23-fa12-4165-bb81-849bbb517f5b","MiMo-V2-Flash (Feb 2026)",122.852,1.404,71.8,21.1,{"aa_id":4778,"ppt_model_id":4771,"slug":2342,"model_name":4779,"provider_name":2344,"name":2343,"provider":2344,"aa_name":4779,"is_open":37,"author_country":2817,"release_date":2346,"release_month":2214,"context_length":1477,"inference_mode":3250,"input_price_per_1m_tokens":404,"output_price_per_1m_tokens":744,"input_price":404,"output_price":744,"tokens_per_second":4780,"time_to_first_token":4781,"benchmark_aime":12,"benchmark_aime_25":2351,"benchmark_gpqa":2347,"benchmark_hle":2684,"benchmark_ifbench":2249,"benchmark_lcr":3158,"benchmark_livecodebench":2348,"benchmark_math_hard":12,"benchmark_mmlu_pro":1268,"benchmark_scicode":148,"benchmark_tau2":2385,"benchmark_terminalbench":3625,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":18,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":2348,"benchmark_mmlu_pro_reasoning":1268,"benchmark_gpqa_reasoning":2347,"benchmark_aime_25_reasoning":2351,"benchmark_hle_reasoning":4776,"benchmark_scicode_reasoning":148,"benchmark_ifbench_reasoning":2249,"benchmark_lcr_reasoning":3158,"benchmark_terminalbench_reasoning":1220,"benchmark_tau2_reasoning":2385,"benchmark_intelligence":2860,"benchmark_coding":3419,"benchmark_intelligence_reasoning":2350,"benchmark_coding_reasoning":2349,"benchmark_math_reasoning":2351},"9bcf2252-9a8a-4ec0-ae4c-d794a370dd7e","MiMo-V2-Flash (Reasoning)",123.066,1.71,{"aa_id":4783,"ppt_model_id":4771,"slug":2342,"model_name":2343,"provider_name":2344,"name":2343,"provider":2344,"aa_name":4784,"is_open":37,"author_country":2817,"release_date":2346,"release_month":2214,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":404,"output_price_per_1m_tokens":744,"input_price":404,"output_price":744,"tokens_per_second":4785,"time_to_first_token":4786,"benchmark_aime":12,"benchmark_aime_25":18,"benchmark_gpqa":3279,"benchmark_hle":615,"benchmark_ifbench":3176,"benchmark_lcr":3239,"benchmark_livecodebench":722,"benchmark_math_hard":12,"benchmark_mmlu_pro":221,"benchmark_scicode":2788,"benchmark_tau2":4571,"benchmark_terminalbench":3419,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":18,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":2348,"benchmark_mmlu_pro_reasoning":1268,"benchmark_gpqa_reasoning":2347,"benchmark_aime_25_reasoning":2351,"benchmark_hle_reasoning":4776,"benchmark_scicode_reasoning":148,"benchmark_ifbench_reasoning":2249,"benchmark_lcr_reasoning":3158,"benchmark_terminalbench_reasoning":1220,"benchmark_tau2_reasoning":2385,"benchmark_intelligence":2860,"benchmark_coding":3419,"benchmark_intelligence_reasoning":2350,"benchmark_coding_reasoning":2349,"benchmark_math_reasoning":2351},"f523d994-baac-4708-a4c1-36a7708ac21f","MiMo-V2-Flash (Non-reasoning)",118.933,1.835,{"aa_id":4788,"ppt_model_id":4789,"slug":2354,"model_name":2355,"provider_name":3400,"name":2355,"provider":3400,"aa_name":2355,"is_open":37,"author_country":2653,"release_date":2357,"release_month":2214,"context_length":181,"inference_mode":2654,"input_price_per_1m_tokens":273,"output_price_per_1m_tokens":25,"input_price":273,"output_price":25,"tokens_per_second":4790,"time_to_first_token":4791,"benchmark_aime":12,"benchmark_aime_25":638,"benchmark_gpqa":4792,"benchmark_hle":565,"benchmark_ifbench":1145,"benchmark_lcr":2667,"benchmark_livecodebench":1417,"benchmark_math_hard":12,"benchmark_mmlu_pro":1224,"benchmark_scicode":2973,"benchmark_tau2":2667,"benchmark_terminalbench":2667,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":638,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3415,"benchmark_coding":2702},"f384a402-af61-4528-a4bd-ef2051274fd9","8f863b63-a41e-4dbc-955f-c475214c42a0",90.37,0.423,59.099999999999994,{"aa_id":4794,"ppt_model_id":4795,"slug":2366,"model_name":4796,"provider_name":248,"name":2367,"provider":248,"aa_name":4796,"is_open":11,"author_country":2653,"release_date":2369,"release_month":2214,"context_length":856,"inference_mode":3250,"input_price_per_1m_tokens":25,"output_price_per_1m_tokens":68,"input_price":25,"output_price":68,"tokens_per_second":4797,"time_to_first_token":4798,"benchmark_aime":12,"benchmark_aime_25":655,"benchmark_gpqa":2154,"benchmark_hle":2837,"benchmark_ifbench":1943,"benchmark_lcr":3991,"benchmark_livecodebench":2155,"benchmark_math_hard":12,"benchmark_mmlu_pro":2372,"benchmark_scicode":1257,"benchmark_tau2":4799,"benchmark_terminalbench":1932,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4800,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":4801,"benchmark_bird_critic":12,"benchmark_darkbench":4802,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":915,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4803,"benchmark_wmdp":4804,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":2155,"benchmark_mmlu_pro_reasoning":2372,"benchmark_gpqa_reasoning":2154,"benchmark_aime_25_reasoning":655,"benchmark_hle_reasoning":425,"benchmark_scicode_reasoning":1257,"benchmark_ifbench_reasoning":1943,"benchmark_lcr_reasoning":3991,"benchmark_terminalbench_reasoning":1932,"benchmark_tau2_reasoning":4799,"benchmark_intelligence":2732,"benchmark_coding":3892,"benchmark_intelligence_reasoning":446,"benchmark_coding_reasoning":276,"benchmark_math_reasoning":655},"a292fb35-f81b-46bb-b06d-8d38a36d6ecf","582c851f-480a-4333-b63b-c7c535bd66b5","Gemini 3 Flash Preview (Reasoning)",189.832,5.904,80.4,84.2498,53.5465,49.0909,12.6667,86.8048,{"aa_id":4806,"ppt_model_id":4795,"slug":2366,"model_name":2367,"provider_name":248,"name":2367,"provider":248,"aa_name":4807,"is_open":11,"author_country":2653,"release_date":2369,"release_month":2214,"context_length":856,"inference_mode":2654,"input_price_per_1m_tokens":25,"output_price_per_1m_tokens":68,"input_price":25,"output_price":68,"tokens_per_second":4808,"time_to_first_token":4809,"benchmark_aime":12,"benchmark_aime_25":915,"benchmark_gpqa":2371,"benchmark_hle":4810,"benchmark_ifbench":1041,"benchmark_lcr":4396,"benchmark_livecodebench":1921,"benchmark_math_hard":12,"benchmark_mmlu_pro":2370,"benchmark_scicode":212,"benchmark_tau2":624,"benchmark_terminalbench":2349,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4800,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":4802,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":915,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4803,"benchmark_wmdp":4804,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":2155,"benchmark_mmlu_pro_reasoning":2372,"benchmark_gpqa_reasoning":2154,"benchmark_aime_25_reasoning":655,"benchmark_hle_reasoning":425,"benchmark_scicode_reasoning":1257,"benchmark_ifbench_reasoning":1943,"benchmark_lcr_reasoning":3991,"benchmark_terminalbench_reasoning":1932,"benchmark_tau2_reasoning":4799,"benchmark_intelligence":2732,"benchmark_coding":3892,"benchmark_intelligence_reasoning":446,"benchmark_coding_reasoning":276,"benchmark_math_reasoning":655},"31eb38cb-655d-42e8-ac5b-0e4d1ab80b96","Gemini 3 Flash Preview (Non-reasoning)",172.251,4.302,14.099999999999998,{"aa_id":4812,"ppt_model_id":4813,"slug":2375,"model_name":4814,"provider_name":4066,"name":2376,"provider":4066,"aa_name":4815,"is_open":37,"author_country":2653,"release_date":2378,"release_month":2214,"context_length":2379,"inference_mode":3250,"input_price_per_1m_tokens":324,"output_price_per_1m_tokens":2315,"input_price":324,"output_price":2315,"tokens_per_second":4816,"time_to_first_token":4817,"benchmark_aime":12,"benchmark_aime_25":2385,"benchmark_gpqa":1156,"benchmark_hle":3412,"benchmark_ifbench":654,"benchmark_lcr":711,"benchmark_livecodebench":2382,"benchmark_math_hard":12,"benchmark_mmlu_pro":2381,"benchmark_scicode":3969,"benchmark_tau2":3666,"benchmark_terminalbench":2349,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":12,"benchmark_agieval_en":4818,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4819,"benchmark_bfcl_v3":12,"benchmark_bird_critic":861,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":3862,"benchmark_knights_and_knaves":12,"benchmark_math":4396,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":2382,"benchmark_mmlu_pro_reasoning":2381,"benchmark_gpqa_reasoning":1156,"benchmark_aime_25_reasoning":2385,"benchmark_hle_reasoning":3412,"benchmark_scicode_reasoning":3969,"benchmark_ifbench_reasoning":654,"benchmark_lcr_reasoning":711,"benchmark_terminalbench_reasoning":2349,"benchmark_tau2_reasoning":1258,"benchmark_intelligence":4241,"benchmark_coding":3507,"benchmark_intelligence_reasoning":2384,"benchmark_coding_reasoning":2383,"benchmark_math_reasoning":2385},"04e97fde-fe24-4e02-9676-afc5011e22de","4aaf502d-cf6d-4f84-a735-155f2125b825","GLM 4.7 (Reasoning)","GLM-4.7 (Reasoning)",73.36,0.701,90.1414,88.3889,{"aa_id":4821,"ppt_model_id":4813,"slug":2375,"model_name":2376,"provider_name":4066,"name":2376,"provider":4066,"aa_name":4822,"is_open":37,"author_country":2653,"release_date":2378,"release_month":2214,"context_length":2379,"inference_mode":2654,"input_price_per_1m_tokens":324,"output_price_per_1m_tokens":2315,"input_price":324,"output_price":2315,"tokens_per_second":4823,"time_to_first_token":4824,"benchmark_aime":12,"benchmark_aime_25":4396,"benchmark_gpqa":1121,"benchmark_hle":2975,"benchmark_ifbench":1206,"benchmark_lcr":2383,"benchmark_livecodebench":2380,"benchmark_math_hard":12,"benchmark_mmlu_pro":2338,"benchmark_scicode":3430,"benchmark_tau2":3424,"benchmark_terminalbench":1203,"benchmark_accountingaudit":1398,"benchmark_agieval_zh":12,"benchmark_agieval_en":4818,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4819,"benchmark_bfcl_v3":12,"benchmark_bird_critic":861,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":3862,"benchmark_knights_and_knaves":12,"benchmark_math":4396,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_livecodebench_reasoning":2382,"benchmark_mmlu_pro_reasoning":2381,"benchmark_gpqa_reasoning":1156,"benchmark_aime_25_reasoning":2385,"benchmark_hle_reasoning":3412,"benchmark_scicode_reasoning":3969,"benchmark_ifbench_reasoning":654,"benchmark_lcr_reasoning":711,"benchmark_terminalbench_reasoning":2349,"benchmark_tau2_reasoning":1258,"benchmark_intelligence":4241,"benchmark_coding":3507,"benchmark_intelligence_reasoning":2384,"benchmark_coding_reasoning":2383,"benchmark_math_reasoning":2385},"5f32cbce-a040-4194-ae51-973e9939aaa9","GLM-4.7 (Non-reasoning)",74.82,0.647,{"aa_id":4826,"ppt_model_id":4827,"slug":2388,"model_name":2389,"provider_name":3889,"name":2389,"provider":3889,"aa_name":4828,"is_open":37,"author_country":2817,"release_date":2391,"release_month":2214,"context_length":2061,"inference_mode":2654,"input_price_per_1m_tokens":1626,"output_price_per_1m_tokens":2392,"input_price":1626,"output_price":2392,"tokens_per_second":4829,"time_to_first_token":4830,"benchmark_aime":12,"benchmark_aime_25":3561,"benchmark_gpqa":2393,"benchmark_hle":1420,"benchmark_ifbench":4300,"benchmark_lcr":623,"benchmark_livecodebench":690,"benchmark_math_hard":12,"benchmark_mmlu_pro":1930,"benchmark_scicode":3773,"benchmark_tau2":4190,"benchmark_terminalbench":3053,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4831,"benchmark_bfcl_v3":12,"benchmark_bird_critic":4832,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":3372,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1165,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":148,"benchmark_coding":1013},"6e68504f-6e60-4de3-8507-291256134b50","b9b79bdc-1699-49e3-a89d-8f3e596d77fc","MiniMax-M2.1",60.424,1.558,85.0253,25.6667,{"aa_id":4834,"ppt_model_id":4835,"slug":2409,"model_name":2410,"provider_name":3400,"name":2410,"provider":3400,"aa_name":2410,"is_open":37,"author_country":2653,"release_date":2412,"release_month":2413,"context_length":181,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":274,"input_price":377,"output_price":274,"tokens_per_second":4836,"time_to_first_token":4837,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":4838,"benchmark_hle":960,"benchmark_ifbench":2350,"benchmark_lcr":2667,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":625,"benchmark_tau2":317,"benchmark_terminalbench":2667,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4083,"benchmark_coding":4839},"4923cb2e-79bb-423a-8aa1-d271c8eb4337","53096d2c-1fea-4852-9d12-1a7691617d94",55.863,0.252,53.900000000000006,5.6,{"aa_id":4841,"ppt_model_id":4842,"slug":2417,"model_name":2418,"provider_name":3400,"name":2418,"provider":3400,"aa_name":4843,"is_open":37,"author_country":2653,"release_date":2420,"release_month":2413,"context_length":2421,"inference_mode":2654,"input_price_per_1m_tokens":377,"output_price_per_1m_tokens":377,"input_price":377,"output_price":377,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":2422,"benchmark_hle":2710,"benchmark_ifbench":4310,"benchmark_lcr":2667,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":3679,"benchmark_tau2":2667,"benchmark_terminalbench":2667,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3148,"benchmark_coding":765},"6d7eec13-fab9-4dd5-9f6a-e1ba50aecf17","e49b137d-cb02-41b4-809a-0a82747b345c","Molmo2-8B",{"aa_id":4845,"ppt_model_id":4846,"slug":2425,"model_name":2426,"provider_name":9,"name":2426,"provider":9,"aa_name":4847,"is_open":11,"author_country":2653,"release_date":2428,"release_month":2413,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":2315,"output_price_per_1m_tokens":439,"input_price":2315,"output_price":439,"tokens_per_second":4848,"time_to_first_token":4849,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":2429,"benchmark_hle":3648,"benchmark_ifbench":3930,"benchmark_lcr":1356,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":1206,"benchmark_tau2":4850,"benchmark_terminalbench":2022,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3676,"benchmark_coding":1124},"b412710e-4e6a-42c1-8b19-1b1c7192d51f","f34b9ff8-38f4-46e4-832e-0f354bb9c6f7","GPT-5.2 Codex (xhigh)",99.584,4.139,92.10000000000001,{"aa_id":4852,"ppt_model_id":4853,"slug":2432,"model_name":4854,"provider_name":4066,"name":2433,"provider":4066,"aa_name":4854,"is_open":37,"author_country":2653,"release_date":2435,"release_month":2413,"context_length":2379,"inference_mode":3250,"input_price_per_1m_tokens":41,"output_price_per_1m_tokens":536,"input_price":41,"output_price":536,"tokens_per_second":4855,"time_to_first_token":4856,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":4857,"benchmark_hle":3651,"benchmark_ifbench":4858,"benchmark_lcr":2732,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":917,"benchmark_tau2":4859,"benchmark_terminalbench":995,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":4860,"benchmark_bbh":12,"benchmark_bfcl_v3":4861,"benchmark_bird_critic":174,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3285,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_gpqa_reasoning":2436,"benchmark_hle_reasoning":3651,"benchmark_scicode_reasoning":917,"benchmark_ifbench_reasoning":4858,"benchmark_lcr_reasoning":2732,"benchmark_terminalbench_reasoning":995,"benchmark_tau2_reasoning":4859,"benchmark_intelligence":447,"benchmark_coding":448,"benchmark_intelligence_reasoning":2437,"benchmark_coding_reasoning":301},"08c3b5dc-479f-4cbd-a510-6ea14641b87f","f1338d50-7a2e-468c-b9bf-647280d7edd9","GLM-4.7-Flash (Reasoning)",85.63,0.713,58.099999999999994,60.8,98.8,26.615,74.5553,{"aa_id":4863,"ppt_model_id":4853,"slug":2432,"model_name":2433,"provider_name":4066,"name":2433,"provider":4066,"aa_name":4864,"is_open":37,"author_country":2653,"release_date":2435,"release_month":2413,"context_length":2379,"inference_mode":2654,"input_price_per_1m_tokens":41,"output_price_per_1m_tokens":536,"input_price":41,"output_price":536,"tokens_per_second":4865,"time_to_first_token":4866,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":1234,"benchmark_hle":960,"benchmark_ifbench":3514,"benchmark_lcr":2742,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":426,"benchmark_tau2":4867,"benchmark_terminalbench":2934,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":4860,"benchmark_bbh":12,"benchmark_bfcl_v3":4861,"benchmark_bird_critic":174,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3285,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_gpqa_reasoning":2436,"benchmark_hle_reasoning":3651,"benchmark_scicode_reasoning":917,"benchmark_ifbench_reasoning":4858,"benchmark_lcr_reasoning":2732,"benchmark_terminalbench_reasoning":995,"benchmark_tau2_reasoning":4859,"benchmark_intelligence":447,"benchmark_coding":448,"benchmark_intelligence_reasoning":2437,"benchmark_coding_reasoning":301},"b99b4a56-b988-4fd7-a253-ef0f25f2a01f","GLM-4.7-Flash (Non-reasoning)",91.402,0.864,91.8,{"aa_id":4869,"ppt_model_id":4870,"slug":2454,"model_name":4871,"provider_name":3988,"name":2455,"provider":3988,"aa_name":4871,"is_open":37,"author_country":2817,"release_date":2457,"release_month":2413,"context_length":1477,"inference_mode":3250,"input_price_per_1m_tokens":2458,"output_price_per_1m_tokens":2459,"input_price":2458,"output_price":2459,"tokens_per_second":4872,"time_to_first_token":4873,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":2460,"benchmark_hle":3013,"benchmark_ifbench":4874,"benchmark_lcr":1764,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":3676,"benchmark_tau2":3666,"benchmark_terminalbench":3429,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4875,"benchmark_bfcl_v3":4876,"benchmark_bird_critic":3472,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":4877,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2667,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_gpqa_reasoning":2460,"benchmark_hle_reasoning":3013,"benchmark_scicode_reasoning":3676,"benchmark_ifbench_reasoning":4878,"benchmark_lcr_reasoning":1764,"benchmark_terminalbench_reasoning":3429,"benchmark_tau2_reasoning":1258,"benchmark_intelligence":3776,"benchmark_coding":3419,"benchmark_intelligence_reasoning":2462,"benchmark_coding_reasoning":2461},"8fcdd0c6-ac4c-464b-affc-993af85b3a0b","5e30509d-44e3-4061-81cf-f2d79f239194","Kimi K2.5 (Reasoning)",33.608,4.091,70.19999999999999,90.9845,64.535,92.6063,70.2,{"aa_id":4880,"ppt_model_id":4870,"slug":2454,"model_name":2455,"provider_name":3988,"name":2455,"provider":3988,"aa_name":4881,"is_open":37,"author_country":2817,"release_date":2457,"release_month":2413,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":2458,"output_price_per_1m_tokens":2459,"input_price":2458,"output_price":2459,"tokens_per_second":4882,"time_to_first_token":4883,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":279,"benchmark_hle":2685,"benchmark_ifbench":1136,"benchmark_lcr":623,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":3803,"benchmark_tau2":1166,"benchmark_terminalbench":2711,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4875,"benchmark_bfcl_v3":4876,"benchmark_bird_critic":3472,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":4877,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2667,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_gpqa_reasoning":2460,"benchmark_hle_reasoning":3013,"benchmark_scicode_reasoning":3676,"benchmark_ifbench_reasoning":4878,"benchmark_lcr_reasoning":1764,"benchmark_terminalbench_reasoning":3429,"benchmark_tau2_reasoning":1258,"benchmark_intelligence":3776,"benchmark_coding":3419,"benchmark_intelligence_reasoning":2462,"benchmark_coding_reasoning":2461},"6edd5aa8-874b-430d-8795-8e90763c3866","Kimi K2.5 (Non-reasoning)",31.145,3.798,{"aa_id":4885,"ppt_model_id":4886,"slug":2465,"model_name":2466,"provider_name":4887,"name":2466,"provider":4887,"aa_name":2466,"is_open":37,"author_country":2817,"release_date":2469,"release_month":2413,"context_length":981,"inference_mode":2654,"input_price_per_1m_tokens":495,"output_price_per_1m_tokens":50,"input_price":495,"output_price":50,"tokens_per_second":4888,"time_to_first_token":4889,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":1376,"benchmark_hle":4674,"benchmark_ifbench":3760,"benchmark_lcr":1124,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":3517,"benchmark_tau2":4890,"benchmark_terminalbench":3777,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3892,"benchmark_coding":2964},"ce496881-6074-4d84-8244-c3bfec559cc8","221e772f-a228-4e47-b0e8-74017a2ac38e","StepFun",84.008,2.568,94.39999999999999,{"aa_id":4892,"ppt_model_id":4893,"slug":2472,"model_name":2473,"provider_name":1833,"name":2473,"provider":1833,"aa_name":2473,"is_open":37,"author_country":2817,"release_date":2475,"release_month":2476,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":411,"output_price_per_1m_tokens":60,"input_price":411,"output_price":60,"tokens_per_second":4894,"time_to_first_token":4756,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":160,"benchmark_hle":450,"benchmark_ifbench":4231,"benchmark_lcr":1201,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":3906,"benchmark_tau2":721,"benchmark_terminalbench":4222,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1059,"benchmark_coding":3519},"0bee3913-9b1b-48f4-b5b4-fe703971f924","d8ff0406-c59d-4cc9-bff3-4195694f6511",157.018,{"aa_id":4896,"ppt_model_id":4897,"slug":2479,"model_name":4898,"provider_name":138,"name":2480,"provider":138,"aa_name":4899,"is_open":11,"author_country":2653,"release_date":2482,"release_month":2476,"context_length":792,"inference_mode":3250,"input_price_per_1m_tokens":505,"output_price_per_1m_tokens":174,"input_price":505,"output_price":174,"tokens_per_second":4900,"time_to_first_token":4901,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":4691,"benchmark_hle":1686,"benchmark_ifbench":613,"benchmark_lcr":1024,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":304,"benchmark_tau2":4850,"benchmark_terminalbench":27,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":4902,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":1357,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3952,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":4903,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4904,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_gpqa_reasoning":2223,"benchmark_hle_reasoning":1686,"benchmark_scicode_reasoning":304,"benchmark_ifbench_reasoning":613,"benchmark_lcr_reasoning":1024,"benchmark_terminalbench_reasoning":27,"benchmark_tau2_reasoning":4905,"benchmark_intelligence":484,"benchmark_coding":300,"benchmark_intelligence_reasoning":2483,"benchmark_coding_reasoning":1984},"77fb5a04-7d8d-4049-b9c8-b0c7071ece3c","9652d719-6040-4b1c-81d1-53a664a839fc","Claude Opus 4.6 (Reasoning)","Claude Opus 4.6 (Adaptive Reasoning, Max Effort)",48.01,8.972,49.2478,95.58,62.6667,92.1,{"aa_id":4907,"ppt_model_id":4897,"slug":2479,"model_name":2480,"provider_name":138,"name":2480,"provider":138,"aa_name":4908,"is_open":11,"author_country":2653,"release_date":2482,"release_month":2476,"context_length":792,"inference_mode":2654,"input_price_per_1m_tokens":505,"output_price_per_1m_tokens":174,"input_price":505,"output_price":174,"tokens_per_second":4909,"time_to_first_token":4910,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":1190,"benchmark_hle":1755,"benchmark_ifbench":4381,"benchmark_lcr":4147,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":1134,"benchmark_tau2":1112,"benchmark_terminalbench":4911,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":4902,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":1357,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3952,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":4903,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4904,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_gpqa_reasoning":2223,"benchmark_hle_reasoning":1686,"benchmark_scicode_reasoning":304,"benchmark_ifbench_reasoning":613,"benchmark_lcr_reasoning":1024,"benchmark_terminalbench_reasoning":27,"benchmark_tau2_reasoning":4905,"benchmark_intelligence":484,"benchmark_coding":300,"benchmark_intelligence_reasoning":2483,"benchmark_coding_reasoning":1984},"f1c29340-1db7-4217-b78c-ccb523ac25ea","Claude Opus 4.6 (Non-reasoning, High Effort)",45.646,1.729,48.5,{"aa_id":4913,"ppt_model_id":4914,"slug":2486,"model_name":4915,"provider_name":1833,"name":2487,"provider":1833,"aa_name":2487,"is_open":11,"author_country":2817,"release_date":2489,"release_month":2476,"context_length":1477,"inference_mode":3250,"input_price_per_1m_tokens":794,"output_price_per_1m_tokens":1875,"input_price":794,"output_price":1875,"tokens_per_second":4916,"time_to_first_token":4917,"benchmark_aime":12,"benchmark_aime_25":1419,"benchmark_gpqa":1685,"benchmark_hle":2836,"benchmark_ifbench":1024,"benchmark_lcr":1145,"benchmark_livecodebench":903,"benchmark_math_hard":12,"benchmark_mmlu_pro":1525,"benchmark_scicode":4440,"benchmark_tau2":1375,"benchmark_terminalbench":4267,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1419,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_gpqa_reasoning":1685,"benchmark_hle_reasoning":916,"benchmark_scicode_reasoning":4440,"benchmark_ifbench_reasoning":1024,"benchmark_lcr_reasoning":1145,"benchmark_terminalbench_reasoning":4267,"benchmark_tau2_reasoning":1375,"benchmark_intelligence":1944,"benchmark_coding":4127,"benchmark_intelligence_reasoning":2164,"benchmark_coding_reasoning":315},"d3d4a7cb-dc3f-47a0-b196-ba08e4d41d2d","6efe9a57-a829-4241-86b9-db3ade53cbc0","Qwen3 Max Thinking (Reasoning)",36.878,1.661,{"aa_id":4919,"ppt_model_id":4914,"slug":2486,"model_name":2487,"provider_name":1833,"name":2487,"provider":1833,"aa_name":4920,"is_open":11,"author_country":2817,"release_date":2489,"release_month":2476,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":794,"output_price_per_1m_tokens":1875,"input_price":794,"output_price":1875,"tokens_per_second":4921,"time_to_first_token":4922,"benchmark_aime":12,"benchmark_aime_25":1419,"benchmark_gpqa":3930,"benchmark_hle":558,"benchmark_ifbench":2806,"benchmark_lcr":4232,"benchmark_livecodebench":903,"benchmark_math_hard":12,"benchmark_mmlu_pro":4005,"benchmark_scicode":118,"benchmark_tau2":1375,"benchmark_terminalbench":1191,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":1419,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_gpqa_reasoning":1685,"benchmark_hle_reasoning":916,"benchmark_scicode_reasoning":4440,"benchmark_ifbench_reasoning":1024,"benchmark_lcr_reasoning":1145,"benchmark_terminalbench_reasoning":4267,"benchmark_tau2_reasoning":1375,"benchmark_intelligence":1944,"benchmark_coding":4127,"benchmark_intelligence_reasoning":2164,"benchmark_coding_reasoning":315},"9b909945-eed9-47d5-92dd-162d51c9e42e","Qwen3 Max Thinking (Preview)",41.94,1.804,{"aa_id":4924,"ppt_model_id":4925,"slug":2492,"model_name":4926,"provider_name":4066,"name":2493,"provider":4066,"aa_name":4927,"is_open":37,"author_country":2653,"release_date":2495,"release_month":2476,"context_length":2379,"inference_mode":3250,"input_price_per_1m_tokens":2496,"output_price_per_1m_tokens":363,"input_price":2496,"output_price":363,"tokens_per_second":4928,"time_to_first_token":4929,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":1192,"benchmark_hle":3597,"benchmark_ifbench":656,"benchmark_lcr":809,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":27,"benchmark_tau2":1355,"benchmark_terminalbench":4613,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4930,"benchmark_arc_challenge":4931,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4932,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3952,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":4933,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":4934,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":3016,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_gpqa_reasoning":1192,"benchmark_hle_reasoning":4935,"benchmark_scicode_reasoning":27,"benchmark_ifbench_reasoning":656,"benchmark_lcr_reasoning":809,"benchmark_terminalbench_reasoning":4613,"benchmark_tau2_reasoning":1355,"benchmark_intelligence":1239,"benchmark_coding":1071,"benchmark_intelligence_reasoning":635,"benchmark_coding_reasoning":2497},"26b6b925-9dfd-4a8b-8da4-359825461542","adccd3de-b10c-4ba8-9543-d4415c20c82f","GLM 5 (Reasoning)","GLM-5 (Reasoning)",57.265,0.934,89.0809,95.9898,94.2866,94.02,91.7177,27.2,{"aa_id":4937,"ppt_model_id":4925,"slug":2492,"model_name":2493,"provider_name":4066,"name":2493,"provider":4066,"aa_name":4938,"is_open":37,"author_country":2653,"release_date":2495,"release_month":2476,"context_length":2379,"inference_mode":2654,"input_price_per_1m_tokens":2496,"output_price_per_1m_tokens":363,"input_price":2496,"output_price":363,"tokens_per_second":4939,"time_to_first_token":4940,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":3525,"benchmark_hle":4941,"benchmark_ifbench":4942,"benchmark_lcr":4397,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":388,"benchmark_tau2":4943,"benchmark_terminalbench":148,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4930,"benchmark_arc_challenge":4931,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4932,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3952,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":4933,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":4934,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":3016,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_gpqa_reasoning":1192,"benchmark_hle_reasoning":4935,"benchmark_scicode_reasoning":27,"benchmark_ifbench_reasoning":656,"benchmark_lcr_reasoning":809,"benchmark_terminalbench_reasoning":4613,"benchmark_tau2_reasoning":1355,"benchmark_intelligence":1239,"benchmark_coding":1071,"benchmark_intelligence_reasoning":635,"benchmark_coding_reasoning":2497},"a2bff639-9d47-43e4-a384-fbe6129cb077","GLM-5 (Non-reasoning)",58.244,1.154,7.199999999999999,55.2,97.39999999999999,{"aa_id":4945,"ppt_model_id":4946,"slug":2500,"model_name":2501,"provider_name":3889,"name":2501,"provider":3889,"aa_name":4947,"is_open":37,"author_country":2817,"release_date":2503,"release_month":2476,"context_length":2061,"inference_mode":2654,"input_price_per_1m_tokens":2504,"output_price_per_1m_tokens":2392,"input_price":2504,"output_price":2392,"tokens_per_second":4948,"time_to_first_token":4949,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":1112,"benchmark_hle":4674,"benchmark_ifbench":4950,"benchmark_lcr":1145,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":276,"benchmark_tau2":4951,"benchmark_terminalbench":3429,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":2954,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4952,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":4953,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4954,"benchmark_coding":145},"50d53952-c066-4c79-9aca-03900a5c652e","9e395aa4-49e3-43a9-a527-d3565c5f1468","MiniMax-M2.5",59.386,1.171,71.6,95.3,84.5185,56.3333,41.9,{"aa_id":4956,"ppt_model_id":4957,"slug":2507,"model_name":2508,"provider_name":1833,"name":2508,"provider":1833,"aa_name":4958,"is_open":37,"author_country":2817,"release_date":2510,"release_month":2476,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":324,"output_price_per_1m_tokens":312,"input_price":324,"output_price":312,"tokens_per_second":4959,"time_to_first_token":4960,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":973,"benchmark_hle":3777,"benchmark_ifbench":1571,"benchmark_lcr":1108,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":1645,"benchmark_tau2":4961,"benchmark_terminalbench":326,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4962,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4963,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3573,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4964,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":436,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":360,"benchmark_coding":145},"a38f7ea6-b683-4969-978e-4f317e16b4e5","a65e22c0-c7f4-4fd9-9441-44d1fdcc23e1","Qwen3.5 397B A17B (Reasoning)",55.61,1.381,95.6,91.4375,89.4333,21.7778,{"aa_id":4966,"ppt_model_id":4957,"slug":2507,"model_name":2508,"provider_name":1833,"name":2508,"provider":1833,"aa_name":4967,"is_open":37,"author_country":2817,"release_date":2510,"release_month":2476,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":324,"output_price_per_1m_tokens":312,"input_price":324,"output_price":312,"tokens_per_second":4968,"time_to_first_token":4969,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":1685,"benchmark_hle":361,"benchmark_ifbench":449,"benchmark_lcr":3640,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":4207,"benchmark_tau2":4571,"benchmark_terminalbench":4453,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4962,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4963,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3573,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4964,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":436,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":360,"benchmark_coding":145},"e4c784fc-5d09-49a7-bc2a-f23a24d2772a","Qwen3.5 397B A17B (Non-reasoning)",50.881,1.39,{"aa_id":12,"ppt_model_id":4971,"slug":2513,"model_name":2514,"provider_name":375,"name":2514,"provider":375,"aa_name":12,"is_open":11,"author_country":2817,"release_date":2516,"release_month":2476,"context_length":792,"inference_mode":2654,"input_price_per_1m_tokens":793,"output_price_per_1m_tokens":2517,"input_price":793,"output_price":2517,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4972,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4973,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":3533,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4974,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":2667,"benchmark_wmdp":12,"benchmark_wmt":12},"0e1bb15b-3774-490a-858d-6f6fa47cf634",77.8083,90.5698,13.1111,{"aa_id":4976,"ppt_model_id":4977,"slug":2520,"model_name":2521,"provider_name":138,"name":2521,"provider":138,"aa_name":4978,"is_open":11,"author_country":2653,"release_date":2523,"release_month":2476,"context_length":792,"inference_mode":2654,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":4979,"time_to_first_token":4980,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":1930,"benchmark_hle":16,"benchmark_ifbench":4727,"benchmark_lcr":1024,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":4981,"benchmark_tau2":1356,"benchmark_terminalbench":2483,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4982,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4983,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4181,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":276,"benchmark_coding":1124},"12b9868c-e47e-42a8-9eaf-2272c0de492a","ca4f2f46-caa8-4008-a230-dc3fb131c5be","Claude Sonnet 4.6 (Adaptive Reasoning, Max Effort)",55.173,42.758,46.800000000000004,89.513,90.2626,{"aa_id":4985,"ppt_model_id":4977,"slug":2520,"model_name":2521,"provider_name":138,"name":2521,"provider":138,"aa_name":4986,"is_open":11,"author_country":2653,"release_date":2523,"release_month":2476,"context_length":792,"inference_mode":2654,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":4987,"time_to_first_token":4988,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":2293,"benchmark_hle":2792,"benchmark_ifbench":3891,"benchmark_lcr":4232,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":3826,"benchmark_tau2":721,"benchmark_terminalbench":27,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4982,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4983,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4181,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":276,"benchmark_coding":1124},"9b42e21c-de45-4dea-8575-977f84ebbdd3","Claude Sonnet 4.6 (Non-reasoning, High Effort)",47.214,1.751,{"aa_id":4990,"ppt_model_id":4977,"slug":2520,"model_name":2521,"provider_name":138,"name":2521,"provider":138,"aa_name":4991,"is_open":11,"author_country":2653,"release_date":2523,"release_month":2476,"context_length":792,"inference_mode":2654,"input_price_per_1m_tokens":68,"output_price_per_1m_tokens":161,"input_price":68,"output_price":161,"tokens_per_second":4992,"time_to_first_token":4993,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":1921,"benchmark_hle":2900,"benchmark_ifbench":879,"benchmark_lcr":3199,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":30,"benchmark_tau2":279,"benchmark_terminalbench":879,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4982,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":4983,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":4181,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":276,"benchmark_coding":1124},"667c3d52-8f3c-4f57-96c0-3d9b4dc8ba75","Claude Sonnet 4.6 (Non-reasoning, Low Effort)",46.586,1.723,{"aa_id":12,"ppt_model_id":4995,"slug":2526,"model_name":2527,"provider_name":248,"name":2527,"provider":248,"aa_name":12,"is_open":11,"author_country":2653,"release_date":2529,"release_month":2476,"context_length":856,"inference_mode":2654,"input_price_per_1m_tokens":78,"output_price_per_1m_tokens":558,"input_price":78,"output_price":558,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":4996,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12},"1a482268-b0d5-47fc-8593-e65d0f675276",93.9906,{"aa_id":4998,"ppt_model_id":4999,"slug":2538,"model_name":2539,"provider_name":9,"name":2539,"provider":9,"aa_name":5000,"is_open":11,"author_country":2653,"release_date":2541,"release_month":2476,"context_length":1669,"inference_mode":2654,"input_price_per_1m_tokens":2315,"output_price_per_1m_tokens":439,"input_price":2315,"output_price":439,"tokens_per_second":5001,"time_to_first_token":5002,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":2542,"benchmark_hle":3176,"benchmark_ifbench":4176,"benchmark_lcr":4580,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":4062,"benchmark_tau2":5003,"benchmark_terminalbench":2483,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":5004,"benchmark_coding":613},"53bbf671-e75d-459e-9765-0c69cd5f532f","b6cfc021-7b0e-4d19-aaed-7084501ab042","GPT-5.3 Codex (xhigh)",65.313,73.285,90.9,54,{"aa_id":12,"ppt_model_id":5006,"slug":2557,"model_name":2558,"provider_name":375,"name":2558,"provider":375,"aa_name":12,"is_open":11,"author_country":2817,"release_date":2560,"release_month":2476,"context_length":792,"inference_mode":2654,"input_price_per_1m_tokens":687,"output_price_per_1m_tokens":793,"input_price":687,"output_price":793,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":5007,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":5008,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":5009,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12},"66649dd4-7e27-42ca-a957-188cbc69df2c",89.4737,90.6159,76.7778,{"aa_id":5011,"ppt_model_id":5012,"slug":2563,"model_name":2564,"provider_name":1833,"name":2564,"provider":1833,"aa_name":5013,"is_open":37,"author_country":2817,"release_date":2566,"release_month":2476,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":793,"output_price_per_1m_tokens":820,"input_price":793,"output_price":820,"tokens_per_second":5014,"time_to_first_token":5015,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":5016,"benchmark_hle":2744,"benchmark_ifbench":1356,"benchmark_lcr":3690,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":1645,"benchmark_tau2":5017,"benchmark_terminalbench":3761,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":5018,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":5019,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":5020,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":784,"benchmark_coding":2964},"b7d3a288-4649-41de-ae1f-dcb818381154","096c3b3f-4e86-4089-8c89-e026de5bbf17","Qwen3.5 122B A10B (Reasoning)",131.447,1.071,85.7,93.60000000000001,90.2592,92.6739,78.1111,{"aa_id":5022,"ppt_model_id":5012,"slug":2563,"model_name":2564,"provider_name":1833,"name":2564,"provider":1833,"aa_name":5023,"is_open":37,"author_country":2817,"release_date":2566,"release_month":2476,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":793,"output_price_per_1m_tokens":820,"input_price":793,"output_price":820,"tokens_per_second":5024,"time_to_first_token":5025,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":3561,"benchmark_hle":2700,"benchmark_ifbench":5026,"benchmark_lcr":5027,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":4453,"benchmark_tau2":1399,"benchmark_terminalbench":556,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":5018,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":5019,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":5020,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":784,"benchmark_coding":2964},"6c9eefa0-222f-47c5-93bb-522f4948aaca","Qwen3.5 122B A10B (Non-reasoning)",132.202,1.007,50.8,56.00000000000001,{"aa_id":5029,"ppt_model_id":5030,"slug":2569,"model_name":2570,"provider_name":1833,"name":2570,"provider":1833,"aa_name":5031,"is_open":37,"author_country":2817,"release_date":2572,"release_month":2476,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":1827,"output_price_per_1m_tokens":312,"input_price":1827,"output_price":312,"tokens_per_second":5032,"time_to_first_token":5033,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":416,"benchmark_hle":1420,"benchmark_ifbench":4192,"benchmark_lcr":4070,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":2461,"benchmark_tau2":5034,"benchmark_terminalbench":1111,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":5035,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":5036,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":5037,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4620,"benchmark_coding":859},"ad17de76-698a-4ccc-a503-008c2599f650","f9ce3f37-10b6-4b40-b664-1581529ecc89","Qwen3.5 27B (Reasoning)",87.723,1.313,93.89999999999999,90.6127,92.3514,77.5556,{"aa_id":5039,"ppt_model_id":5030,"slug":2569,"model_name":2570,"provider_name":1833,"name":2570,"provider":1833,"aa_name":5040,"is_open":37,"author_country":2817,"release_date":2572,"release_month":2476,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":1827,"output_price_per_1m_tokens":312,"input_price":1827,"output_price":312,"tokens_per_second":5041,"time_to_first_token":5042,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":513,"benchmark_hle":2792,"benchmark_ifbench":3826,"benchmark_lcr":915,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":1686,"benchmark_tau2":1221,"benchmark_terminalbench":2349,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":5035,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":5036,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":5037,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4620,"benchmark_coding":859},"cf4d0234-dc61-48cc-a26e-582f44b974c3","Qwen3.5 27B (Non-reasoning)",87.818,1.327,{"aa_id":5044,"ppt_model_id":5045,"slug":2575,"model_name":2576,"provider_name":1833,"name":2576,"provider":1833,"aa_name":5046,"is_open":37,"author_country":2817,"release_date":2578,"release_month":2476,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":2579,"output_price_per_1m_tokens":312,"input_price":2579,"output_price":312,"tokens_per_second":5047,"time_to_first_token":5048,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":1399,"benchmark_hle":2295,"benchmark_ifbench":5049,"benchmark_lcr":4588,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":3692,"benchmark_tau2":5050,"benchmark_terminalbench":3411,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":5007,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":5051,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":5052,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2896,"benchmark_coding":3658},"f1a164d5-3d89-42a4-96ed-3b11b1663c20","0dba8c58-9e0c-4e84-9588-c35b08e261eb","Qwen3.5 35B A3B (Reasoning)",115.293,1.083,72.5,89.2,90.8309,76.4444,{"aa_id":5054,"ppt_model_id":5045,"slug":2575,"model_name":2576,"provider_name":1833,"name":2576,"provider":1833,"aa_name":5055,"is_open":37,"author_country":2817,"release_date":2578,"release_month":2476,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":2579,"output_price_per_1m_tokens":312,"input_price":2579,"output_price":312,"tokens_per_second":5056,"time_to_first_token":5057,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":3365,"benchmark_hle":2657,"benchmark_ifbench":5058,"benchmark_lcr":5059,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":2973,"benchmark_tau2":1253,"benchmark_terminalbench":2812,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":5007,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":5051,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":5052,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2896,"benchmark_coding":3658},"f47bd28a-ea44-42ad-9caa-91ac1063f108","Qwen3.5 35B A3B (Non-reasoning)",124.352,1.023,44.5,55.300000000000004,{"aa_id":5061,"ppt_model_id":5062,"slug":2601,"model_name":2602,"provider_name":1277,"name":2602,"provider":1277,"aa_name":2602,"is_open":37,"author_country":5063,"release_date":2604,"release_month":2592,"context_length":129,"inference_mode":2654,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":60,"input_price":143,"output_price":60,"tokens_per_second":5064,"time_to_first_token":5065,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":771,"benchmark_hle":3151,"benchmark_ifbench":5066,"benchmark_lcr":2383,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":118,"benchmark_tau2":710,"benchmark_terminalbench":3411,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":1013,"benchmark_coding":3767},"3521c0d7-c188-451c-bea7-b1286f1ae6f0","ff74d893-90eb-465b-a794-b9b70cb2c24b","ae",752.705,3.87,69.8,{"aa_id":5068,"ppt_model_id":5069,"slug":2607,"model_name":2608,"provider_name":9,"name":2608,"provider":9,"aa_name":5070,"is_open":11,"author_country":2653,"release_date":2610,"release_month":2592,"context_length":2611,"inference_mode":2654,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":161,"input_price":220,"output_price":161,"tokens_per_second":5071,"time_to_first_token":5072,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":2216,"benchmark_hle":3713,"benchmark_ifbench":745,"benchmark_lcr":4580,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":4727,"benchmark_tau2":2542,"benchmark_terminalbench":5073,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3430,"benchmark_coding":810},"083f3ea3-19f9-4675-baf5-c6ca080cab86","50a322eb-331c-4271-a1c7-1eb81844b41d","GPT-5.4 (xhigh)",73.821,154.615,57.599999999999994,{"aa_id":5075,"ppt_model_id":5069,"slug":2607,"model_name":2608,"provider_name":9,"name":2608,"provider":9,"aa_name":5076,"is_open":11,"author_country":2653,"release_date":2610,"release_month":2592,"context_length":2611,"inference_mode":2654,"input_price_per_1m_tokens":220,"output_price_per_1m_tokens":161,"input_price":220,"output_price":161,"tokens_per_second":5077,"time_to_first_token":5078,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":767,"benchmark_hle":2812,"benchmark_ifbench":673,"benchmark_lcr":892,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":3052,"benchmark_tau2":2674,"benchmark_terminalbench":198,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3430,"benchmark_coding":810},"7ec65ec7-d0cb-4b44-9197-03ca625a566d","GPT-5.4 (Non-reasoning)",59.113,0.584,{"aa_id":5080,"ppt_model_id":5081,"slug":2614,"model_name":2615,"provider_name":9,"name":2615,"provider":9,"aa_name":5082,"is_open":11,"author_country":2653,"release_date":2617,"release_month":2592,"context_length":2611,"inference_mode":2654,"input_price_per_1m_tokens":16,"output_price_per_1m_tokens":2618,"input_price":16,"output_price":2618,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":12,"benchmark_hle":12,"benchmark_ifbench":12,"benchmark_lcr":12,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":12,"benchmark_tau2":12,"benchmark_terminalbench":12,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12},"bb1a9d61-8a4b-437d-ba7d-fe68f624a05d","be832d32-7ebe-4146-a876-06ae6a07ad3e","GPT-5.4 Pro (xhigh)",{"aa_id":5084,"ppt_model_id":5085,"slug":2621,"model_name":2622,"provider_name":1833,"name":2622,"provider":1833,"aa_name":5086,"is_open":37,"author_country":2817,"release_date":2624,"release_month":2592,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":208,"output_price_per_1m_tokens":273,"input_price":208,"output_price":273,"tokens_per_second":5087,"time_to_first_token":3513,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":3526,"benchmark_hle":3679,"benchmark_ifbench":3690,"benchmark_lcr":623,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":3326,"benchmark_tau2":2348,"benchmark_terminalbench":4267,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3777,"benchmark_coding":5088},"013064eb-90ed-4781-9ec6-173869643c1e","68865bdd-0c47-46e2-bc8d-5b65ea94d7ea","Qwen3.5 9B (Reasoning)",163.868,21.4,{"aa_id":5090,"ppt_model_id":5085,"slug":2621,"model_name":2622,"provider_name":1833,"name":2622,"provider":1833,"aa_name":5091,"is_open":37,"author_country":2817,"release_date":2624,"release_month":2592,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":208,"output_price_per_1m_tokens":273,"input_price":208,"output_price":273,"tokens_per_second":5092,"time_to_first_token":5093,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":2982,"benchmark_hle":4439,"benchmark_ifbench":3892,"benchmark_lcr":3774,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":3292,"benchmark_tau2":1744,"benchmark_terminalbench":4222,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":3777,"benchmark_coding":5088},"c659dd40-fb47-43ab-9f75-09ee4fe4c25e","Qwen3.5 9B (Non-reasoning)",187.424,0.542,{"aa_id":5095,"ppt_model_id":5096,"slug":2627,"model_name":2628,"provider_name":5097,"name":2628,"provider":5097,"aa_name":5098,"is_open":11,"author_country":2817,"release_date":2630,"release_month":2592,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":143,"output_price_per_1m_tokens":78,"input_price":143,"output_price":78,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":3279,"benchmark_hle":995,"benchmark_ifbench":5099,"benchmark_lcr":1182,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":488,"benchmark_tau2":1527,"benchmark_terminalbench":2295,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2383,"benchmark_coding":5088},"20b02309-0c41-441c-b3a1-baddc9955e4d","e6e2e575-8967-4fdd-8af9-d80196ba3df7","ByteDance Seed","Doubao Seed 2.0 lite (Reasoning)",61.199999999999996,{"aa_id":5101,"ppt_model_id":5102,"slug":2633,"model_name":2634,"provider_name":4066,"name":2634,"provider":4066,"aa_name":5103,"is_open":11,"author_country":2653,"release_date":2636,"release_month":2592,"context_length":2379,"inference_mode":2654,"input_price_per_1m_tokens":182,"output_price_per_1m_tokens":69,"input_price":182,"output_price":69,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":1844,"benchmark_hle":1511,"benchmark_ifbench":313,"benchmark_lcr":3251,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":4049,"benchmark_tau2":870,"benchmark_terminalbench":3213,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":2462,"benchmark_coding":3827},"0cb7dbc1-33a6-4920-9573-94ae1450496a","faeb05d7-ff38-4a77-ab1f-70c01fd21f3d","GLM-5-Turbo",{"aa_id":5105,"ppt_model_id":5106,"slug":2639,"model_name":2640,"provider_name":3889,"name":2640,"provider":3889,"aa_name":5107,"is_open":11,"author_country":2817,"release_date":2642,"release_month":2592,"context_length":1939,"inference_mode":2654,"input_price_per_1m_tokens":50,"output_price_per_1m_tokens":182,"input_price":50,"output_price":182,"tokens_per_second":5108,"time_to_first_token":5109,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":2323,"benchmark_hle":3366,"benchmark_ifbench":1356,"benchmark_lcr":749,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":1219,"benchmark_tau2":1112,"benchmark_terminalbench":148,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":5110,"benchmark_coding":4954},"2faca2e8-9af1-490e-b648-1bdb42d0a72f","0f8a5b79-9d63-4221-9a5a-a3bac0a284d4","MiniMax-M2.7",40.057,2.093,49.6,{"aa_id":5112,"ppt_model_id":5113,"slug":2645,"model_name":2646,"provider_name":2344,"name":2646,"provider":2344,"aa_name":5114,"is_open":11,"author_country":2817,"release_date":2648,"release_month":2592,"context_length":1477,"inference_mode":2654,"input_price_per_1m_tokens":536,"output_price_per_1m_tokens":78,"input_price":536,"output_price":78,"tokens_per_second":12,"time_to_first_token":12,"benchmark_aime":12,"benchmark_aime_25":12,"benchmark_gpqa":1187,"benchmark_hle":3982,"benchmark_ifbench":903,"benchmark_lcr":3690,"benchmark_livecodebench":12,"benchmark_math_hard":12,"benchmark_mmlu_pro":12,"benchmark_scicode":1686,"benchmark_tau2":5115,"benchmark_terminalbench":3429,"benchmark_accountingaudit":12,"benchmark_agieval_zh":12,"benchmark_agieval_en":12,"benchmark_arc_challenge":12,"benchmark_arc_easy":12,"benchmark_bbeh":12,"benchmark_bbh":12,"benchmark_bfcl_v3":12,"benchmark_bird_critic":12,"benchmark_darkbench":12,"benchmark_formal_logic_exp":12,"benchmark_gaia":12,"benchmark_gsm8k":12,"benchmark_humaneval":12,"benchmark_ifeval":12,"benchmark_knights_and_knaves":12,"benchmark_math":12,"benchmark_mbppplus":12,"benchmark_medqa":12,"benchmark_mmlu":12,"benchmark_mmmu":12,"benchmark_multichallenge":12,"benchmark_simpleqa":12,"benchmark_stock_bcs":12,"benchmark_swe_bench_lite":12,"benchmark_wmdp":12,"benchmark_wmt":12,"benchmark_intelligence":4475,"benchmark_coding":5116},"aed82eff-96a4-4652-86fd-2754df9c6e96","6190c93a-00f4-4122-98ad-b2ac07badb51","MiMo-V2-Omni",91.2,35.5,[5118,5132,5144,5156,5169,5181,5194,5206,5218,5230,5243,5255,5267,5280,5292,5303,5315,5326,5338,5349,5360,5371,5382,5393,5404,5415,5426,5437,5449,5460,5471,5482,5493,5504,5515,5526,5537,5548,5559],{"slug":5119,"field":5120,"name":5121,"description":5122,"categories":5123,"model_count":5125,"source":5126,"top_models":5127},"gpqa","benchmark_gpqa","GPQA","Graduate-level multiple-choice questions written by domain experts in biology, physics, and chemistry. Questions are Google-proof and extremely difficult.",[5124],"Reasoning and Logic",239,"artificial_analysis",[5128,5129,5130,5131],{"name":2608,"provider":9,"score":2216,"inference_mode":2654},{"name":2539,"provider":9,"score":2542,"inference_mode":2654},{"name":2151,"provider":248,"score":2155,"inference_mode":2654},{"name":2319,"provider":9,"score":1169,"inference_mode":2654},{"slug":5133,"field":5134,"name":5135,"description":5136,"categories":5137,"model_count":5138,"source":5126,"top_models":5139},"hle","benchmark_hle","Humanity's Last Exam","Humanity's Last Exam — extremely challenging questions designed to test the upper limits of AI capability across diverse domains.",[5124],238,[5140,5141,5142,5143],{"name":2608,"provider":9,"score":3713,"inference_mode":2654},{"name":2539,"provider":9,"score":3176,"inference_mode":2654},{"name":2151,"provider":248,"score":4620,"inference_mode":2654},{"name":2480,"provider":138,"score":1686,"inference_mode":3250},{"slug":5145,"field":5146,"name":5147,"description":5148,"categories":5149,"model_count":5138,"source":5126,"top_models":5151},"scicode","benchmark_scicode","SciCode","Science coding benchmark measuring AI ability to solve scientific computing tasks.",[5150],"Computer Science and Programming",[5152,5153,5154,5155],{"name":2608,"provider":9,"score":4727,"inference_mode":2654},{"name":2151,"provider":248,"score":4486,"inference_mode":2654},{"name":2426,"provider":9,"score":1206,"inference_mode":2654},{"name":2539,"provider":9,"score":4062,"inference_mode":2654},{"slug":5157,"field":5158,"name":5159,"description":5160,"categories":5161,"model_count":5163,"source":5126,"top_models":5164},"ifbench","benchmark_ifbench","IFBench","Instruction Following Benchmark measuring LLM ability to adhere to nuanced writing constraints and formatting requirements.",[5162],"Instruction Following",218,[5165,5166,5167,5168],{"name":2508,"provider":1833,"score":1571,"inference_mode":2654},{"name":2367,"provider":248,"score":1943,"inference_mode":3250},{"name":2426,"provider":9,"score":3930,"inference_mode":2654},{"name":2564,"provider":1833,"score":1356,"inference_mode":2654},{"slug":5170,"field":5171,"name":5172,"description":5173,"categories":5174,"model_count":5175,"source":5126,"top_models":5176},"lcr","benchmark_lcr","LCR","Long Context Retrieval benchmark testing ability to find and use information in very long documents.",[5124],217,[5177,5178,5179,5180],{"name":2426,"provider":9,"score":1356,"inference_mode":2654},{"name":1681,"provider":9,"score":4192,"inference_mode":2654},{"name":2137,"provider":9,"score":1351,"inference_mode":2654},{"name":2110,"provider":4577,"score":4580,"inference_mode":2654},{"slug":5182,"field":5183,"name":5184,"description":5185,"categories":5186,"model_count":5188,"source":5126,"top_models":5189},"tau2","benchmark_tau2","Tau2","Tau2 benchmark testing multi-turn agent capabilities in airline and retail domains.",[5187],"Multi-turn",214,[5190,5191,5192,5193],{"name":2433,"provider":4066,"score":4859,"inference_mode":3250},{"name":2634,"provider":4066,"score":870,"inference_mode":2654},{"name":2493,"provider":4066,"score":1355,"inference_mode":3250},{"name":2493,"provider":4066,"score":4943,"inference_mode":2654},{"slug":5195,"field":5196,"name":5197,"description":5198,"categories":5199,"model_count":5200,"source":5126,"top_models":5201},"terminalbench","benchmark_terminalbench","TerminalBench","Terminal-based benchmark testing AI ability to interact with command-line interfaces and solve system tasks.",[5187],209,[5202,5203,5204,5205],{"name":2608,"provider":9,"score":5073,"inference_mode":2654},{"name":2521,"provider":138,"score":2483,"inference_mode":2654},{"name":2539,"provider":9,"score":2483,"inference_mode":2654},{"name":2480,"provider":138,"score":4911,"inference_mode":2654},{"slug":5207,"field":5208,"name":5209,"description":5210,"categories":5211,"model_count":5212,"source":5126,"top_models":5213},"livecodebench","benchmark_livecodebench","LiveCodeBench","Real-world coding benchmark with problems from competitive programming contests, testing code generation and problem-solving abilities.",[5150],200,[5214,5215,5216,5217],{"name":2151,"provider":248,"score":2156,"inference_mode":2654},{"name":2367,"provider":248,"score":2155,"inference_mode":3250},{"name":2220,"provider":3115,"score":4691,"inference_mode":2654},{"name":2376,"provider":4066,"score":2382,"inference_mode":3250},{"slug":5219,"field":5220,"name":5221,"description":5222,"categories":5223,"model_count":5212,"source":5126,"top_models":5225},"mmlu-pro","benchmark_mmlu_pro","MMLU-Pro","Massive Multitask Language Understanding benchmark testing knowledge across 57 diverse subjects including STEM, humanities, social sciences, and professional domains.",[5224],"General Knowledge",[5226,5227,5228,5229],{"name":2151,"provider":248,"score":2154,"inference_mode":2654},{"name":2194,"provider":138,"score":2197,"inference_mode":3250},{"name":2367,"provider":248,"score":2372,"inference_mode":3250},{"name":2194,"provider":138,"score":1070,"inference_mode":2654},{"slug":5231,"field":5232,"name":5233,"description":5234,"categories":5235,"model_count":5237,"source":5126,"top_models":5238},"aime-25","benchmark_aime_25","AIME 2025","American Invitational Mathematics Examination 2025 problems testing olympiad-level mathematical reasoning.",[5236],"Mathematical Problem Solving",174,[5239,5240,5241,5242],{"name":2319,"provider":9,"score":1501,"inference_mode":2654},{"name":1858,"provider":9,"score":4213,"inference_mode":2654},{"name":2367,"provider":248,"score":655,"inference_mode":3250},{"name":2220,"provider":3115,"score":1408,"inference_mode":2654},{"slug":5244,"field":5245,"name":5246,"description":5247,"categories":5248,"model_count":5249,"source":5126,"top_models":5250},"math-500","benchmark_math_hard","MATH-500","Competition mathematics problems requiring multi-step reasoning, covering algebra, geometry, number theory, and calculus.",[5236],116,[5251,5252,5253,5254],{"name":1681,"provider":9,"score":4193,"inference_mode":2654},{"name":1162,"provider":9,"score":1168,"inference_mode":2654},{"name":1389,"provider":3823,"score":1168,"inference_mode":2654},{"name":1336,"provider":138,"score":1343,"inference_mode":3250},{"slug":5256,"field":5257,"name":5258,"description":5259,"categories":5260,"model_count":5261,"source":5126,"top_models":5262},"aime","benchmark_aime","AIME 2024","American Invitational Mathematics Examination 2024 problems testing olympiad-level mathematical reasoning.",[5236],115,[5263,5264,5265,5266],{"name":1681,"provider":9,"score":943,"inference_mode":2654},{"name":1496,"provider":3823,"score":1502,"inference_mode":2654},{"name":1150,"provider":9,"score":1158,"inference_mode":2654},{"name":1586,"provider":1833,"score":1158,"inference_mode":3250},{"slug":5268,"field":5269,"name":5270,"description":5271,"categories":5272,"model_count":5273,"source":5274,"top_models":5275},"agieval-en","benchmark_agieval_en","AGIEval English","AGIEval English — human-level reasoning tasks from standardized exams like SAT, LSAT, and civil service exams.",[5124],114,"stratix",[5276,5277,5278,5279],{"name":2527,"provider":248,"score":4996,"inference_mode":2654},{"name":2151,"provider":248,"score":4622,"inference_mode":2654},{"name":2508,"provider":1833,"score":4962,"inference_mode":2654},{"name":2508,"provider":1833,"score":4962,"inference_mode":2654},{"slug":5281,"field":5282,"name":5283,"description":5284,"categories":5285,"model_count":5286,"source":5274,"top_models":5287},"bbh","benchmark_bbh","BBH","Big-Bench Hard — challenging subset of BIG-Bench focusing on tasks where language models previously underperformed.",[5124],109,[5288,5289,5290,5291],{"name":1927,"provider":138,"score":4456,"inference_mode":3250},{"name":1927,"provider":138,"score":4466,"inference_mode":2654},{"name":2493,"provider":4066,"score":4932,"inference_mode":3250},{"name":2493,"provider":4066,"score":4932,"inference_mode":2654},{"slug":5293,"field":5294,"name":5295,"description":5296,"categories":5297,"model_count":4580,"source":5274,"top_models":5298},"humaneval","benchmark_humaneval","HumanEval","OpenAI HumanEval benchmark measuring Python code generation from function docstrings.",[5150],[5299,5300,5301,5302],{"name":1927,"provider":138,"score":4457,"inference_mode":3250},{"name":704,"provider":3115,"score":3129,"inference_mode":2654},{"name":1496,"provider":3823,"score":3952,"inference_mode":2654},{"name":1927,"provider":138,"score":3952,"inference_mode":2654},{"slug":5304,"field":5305,"name":5306,"description":5307,"categories":5308,"model_count":1786,"source":5274,"top_models":5310},"accountingaudit","benchmark_accountingaudit","Accounting Audit","Accounting and audit benchmark testing financial reasoning capabilities.",[5309],"Financial Reasoning",[5311,5312,5313,5314],{"name":884,"provider":138,"score":3255,"inference_mode":3250},{"name":1310,"provider":248,"score":3255,"inference_mode":2654},{"name":884,"provider":138,"score":3190,"inference_mode":2654},{"name":910,"provider":1833,"score":3190,"inference_mode":2654},{"slug":5316,"field":5317,"name":5318,"description":5319,"categories":5320,"model_count":1786,"source":5274,"top_models":5321},"mbppplus","benchmark_mbppplus","MBPP Plus","Mostly Basic Python Problems Plus — tests Python code generation with enhanced test cases.",[5150],[5322,5323,5324,5325],{"name":1179,"provider":1833,"score":3589,"inference_mode":3250},{"name":1179,"provider":1833,"score":3589,"inference_mode":2654},{"name":704,"provider":3115,"score":3132,"inference_mode":2654},{"name":1173,"provider":9,"score":3576,"inference_mode":2654},{"slug":5327,"field":5328,"name":5329,"description":5330,"categories":5331,"model_count":17,"source":5274,"top_models":5333},"mmmu","benchmark_mmmu","MMMU","Multimodal Understanding benchmark testing vision-language models on expert-level tasks.",[5332],"Multimodal",[5334,5335,5336,5337],{"name":1173,"provider":9,"score":3578,"inference_mode":2654},{"name":1681,"provider":9,"score":4200,"inference_mode":2654},{"name":1681,"provider":9,"score":4200,"inference_mode":2654},{"name":1681,"provider":9,"score":4200,"inference_mode":2654},{"slug":5339,"field":5340,"name":5341,"description":5342,"categories":5343,"model_count":3633,"source":5274,"top_models":5344},"swe-bench-lite","benchmark_swe_bench_lite","SWE-bench Lite","Software Engineering benchmark testing ability to resolve real GitHub issues.",[5187],[5345,5346,5347,5348],{"name":2480,"provider":138,"score":4904,"inference_mode":3250},{"name":2480,"provider":138,"score":4904,"inference_mode":2654},{"name":2501,"provider":3889,"score":4953,"inference_mode":2654},{"name":1681,"provider":9,"score":2924,"inference_mode":2654},{"slug":5350,"field":5351,"name":5352,"description":5353,"categories":5354,"model_count":2483,"source":5274,"top_models":5355},"gsm8k","benchmark_gsm8k","GSM8K","Grade School Math 8K — 8,500 high quality grade school math word problems.",[5236],[5356,5357,5358,5359],{"name":1348,"provider":138,"score":3790,"inference_mode":3250},{"name":1348,"provider":138,"score":3790,"inference_mode":2654},{"name":704,"provider":3115,"score":3128,"inference_mode":2654},{"name":1173,"provider":9,"score":3572,"inference_mode":2654},{"slug":5361,"field":5362,"name":5363,"description":5364,"categories":5365,"model_count":4148,"source":5274,"top_models":5366},"simpleqa","benchmark_simpleqa","SimpleQA","Simple question answering benchmark testing factual accuracy and knowledge retrieval.",[5124,5224],[5367,5368,5369,5370],{"name":1403,"provider":248,"score":3864,"inference_mode":2654},{"name":1540,"provider":1833,"score":4021,"inference_mode":2654},{"name":1881,"provider":1833,"score":4406,"inference_mode":2654},{"name":1128,"provider":9,"score":3539,"inference_mode":2654},{"slug":5372,"field":5373,"name":5374,"description":5375,"categories":5376,"model_count":1645,"source":5274,"top_models":5377},"arc-challenge","benchmark_arc_challenge","ARC Challenge","AI2 Reasoning Challenge (Challenge set) — grade-school science questions requiring complex reasoning.",[5124],[5378,5379,5380,5381],{"name":1681,"provider":9,"score":4196,"inference_mode":2654},{"name":1681,"provider":9,"score":4196,"inference_mode":2654},{"name":1681,"provider":9,"score":4196,"inference_mode":2654},{"name":1681,"provider":9,"score":4196,"inference_mode":2654},{"slug":5383,"field":5384,"name":5385,"description":5386,"categories":5387,"model_count":1071,"source":5274,"top_models":5388},"bbeh","benchmark_bbeh","BBEH","Big Bench Extra Hard — even more challenging reasoning tasks pushing the limits of language model capabilities.",[5124],[5389,5390,5391,5392],{"name":1681,"provider":9,"score":4197,"inference_mode":2654},{"name":1681,"provider":9,"score":4197,"inference_mode":2654},{"name":1681,"provider":9,"score":4197,"inference_mode":2654},{"name":1681,"provider":9,"score":4197,"inference_mode":2654},{"slug":5394,"field":5395,"name":5396,"description":5397,"categories":5398,"model_count":4397,"source":5274,"top_models":5399},"arc-easy","benchmark_arc_easy","ARC Easy","AI2 Reasoning Challenge (Easy set) — grade-school science questions.",[5124],[5400,5401,5402,5403],{"name":1348,"provider":138,"score":3787,"inference_mode":3250},{"name":1348,"provider":138,"score":3787,"inference_mode":2654},{"name":1196,"provider":1833,"score":3607,"inference_mode":3250},{"name":1196,"provider":1833,"score":3607,"inference_mode":2654},{"slug":5405,"field":5406,"name":5407,"description":5408,"categories":5409,"model_count":1357,"source":5274,"top_models":5410},"math","benchmark_math","Mathematics","Mathematics benchmark covering algebra, geometry, number theory, and calculus problems.",[5236],[5411,5412,5413,5414],{"name":2480,"provider":138,"score":4903,"inference_mode":3250},{"name":2480,"provider":138,"score":4903,"inference_mode":2654},{"name":1173,"provider":9,"score":3575,"inference_mode":2654},{"name":2493,"provider":4066,"score":4933,"inference_mode":3250},{"slug":5416,"field":5417,"name":5418,"description":5419,"categories":5420,"model_count":1357,"source":5274,"top_models":5421},"medqa","benchmark_medqa","MedQA","Medical question answering benchmark from USMLE-style questions.",[5124],[5422,5423,5424,5425],{"name":1173,"provider":9,"score":3577,"inference_mode":2654},{"name":1403,"provider":248,"score":3863,"inference_mode":2654},{"name":884,"provider":138,"score":3268,"inference_mode":3250},{"name":704,"provider":3115,"score":3133,"inference_mode":2654},{"slug":5427,"field":5428,"name":5429,"description":5430,"categories":5431,"model_count":1357,"source":5274,"top_models":5432},"mmlu","benchmark_mmlu","MMLU","Massive Multitask Language Understanding — tests knowledge across 57 subjects.",[5224],[5433,5434,5435,5436],{"name":2493,"provider":4066,"score":4934,"inference_mode":3250},{"name":2493,"provider":4066,"score":4934,"inference_mode":2654},{"name":1361,"provider":3115,"score":3813,"inference_mode":2654},{"name":1083,"provider":1076,"score":3497,"inference_mode":2654},{"slug":5438,"field":5439,"name":5440,"description":5441,"categories":5442,"model_count":3507,"source":5274,"top_models":5444},"agieval-zh","benchmark_agieval_zh","AGIEval Chinese","AGIEval Chinese — reasoning tasks from Chinese standardized exams (Gaokao, civil service).",[5124,5443],"Multilingual",[5445,5446,5447,5448],{"name":1916,"provider":3115,"score":4430,"inference_mode":3250},{"name":1179,"provider":1833,"score":3585,"inference_mode":3250},{"name":1179,"provider":1833,"score":3585,"inference_mode":2654},{"name":1447,"provider":1448,"score":3931,"inference_mode":2654},{"slug":5450,"field":5451,"name":5452,"description":5453,"categories":5454,"model_count":936,"source":5274,"top_models":5455},"stock-bcs","benchmark_stock_bcs","Stock BCS","Stock market benchmark testing financial analysis capabilities.",[5309],[5456,5457,5458,5459],{"name":408,"provider":1833,"score":2827,"inference_mode":2654},{"name":704,"provider":3115,"score":3136,"inference_mode":2654},{"name":1128,"provider":9,"score":3136,"inference_mode":2654},{"name":762,"provider":9,"score":3190,"inference_mode":2654},{"slug":5461,"field":5462,"name":5463,"description":5464,"categories":5465,"model_count":747,"source":5274,"top_models":5466},"bird-critic","benchmark_bird_critic","BIRD-CRITIC","BIRD-CRITIC — multi-turn benchmark testing SQL generation and database interaction.",[5187],[5467,5468,5469,5470],{"name":2480,"provider":138,"score":1357,"inference_mode":3250},{"name":2480,"provider":138,"score":1357,"inference_mode":2654},{"name":2376,"provider":4066,"score":861,"inference_mode":3250},{"name":2376,"provider":4066,"score":861,"inference_mode":2654},{"slug":5472,"field":5473,"name":5474,"description":5475,"categories":5476,"model_count":174,"source":5274,"top_models":5477},"knights-and-knaves","benchmark_knights_and_knaves","Knights and Knaves","Logic puzzle benchmark based on knights (truth-tellers) and knaves (liars) puzzles.",[5124],[5478,5479,5480,5481],{"name":762,"provider":9,"score":3184,"inference_mode":2654},{"name":1173,"provider":9,"score":3574,"inference_mode":2654},{"name":1361,"provider":3115,"score":3811,"inference_mode":2654},{"name":704,"provider":3115,"score":3130,"inference_mode":2654},{"slug":5483,"field":5484,"name":5485,"description":5486,"categories":5487,"model_count":3506,"source":5274,"top_models":5488},"ifeval","benchmark_ifeval","IFEval","Instruction Following Evaluation benchmark testing how well LLMs follow detailed formatting and content constraints.",[5162],[5489,5490,5491,5492],{"name":2455,"provider":3988,"score":4877,"inference_mode":3250},{"name":2455,"provider":3988,"score":4877,"inference_mode":2654},{"name":1403,"provider":248,"score":3862,"inference_mode":2654},{"name":2376,"provider":4066,"score":3862,"inference_mode":3250},{"slug":5494,"field":5495,"name":5496,"description":5497,"categories":5498,"model_count":995,"source":5274,"top_models":5499},"bfcl-v3","benchmark_bfcl_v3","BFCL v3","Berkeley Function Calling Leaderboard v3 — testing function/tool calling accuracy.",[5187],[5500,5501,5502,5503],{"name":1604,"provider":4066,"score":4087,"inference_mode":3250},{"name":1196,"provider":1833,"score":3609,"inference_mode":3250},{"name":1196,"provider":1833,"score":3609,"inference_mode":2654},{"name":1872,"provider":1833,"score":4388,"inference_mode":2654},{"slug":5505,"field":5506,"name":5507,"description":5508,"categories":5509,"model_count":1243,"source":5274,"top_models":5510},"formal-logic-exp","benchmark_formal_logic_exp","Formal Logic Extended","Extended formal logic benchmark testing deductive and propositional reasoning.",[5124],[5511,5512,5513,5514],{"name":762,"provider":9,"score":3181,"inference_mode":2654},{"name":1361,"provider":3115,"score":1168,"inference_mode":2654},{"name":704,"provider":3115,"score":3127,"inference_mode":2654},{"name":884,"provider":138,"score":3261,"inference_mode":3250},{"slug":5516,"field":5517,"name":5518,"description":5519,"categories":5520,"model_count":2098,"source":5274,"top_models":5521},"wmdp","benchmark_wmdp","WMDP","Weapons of Mass Destruction Proxy — benchmark testing knowledge safety boundaries.",[5124],[5522,5523,5524,5525],{"name":2367,"provider":248,"score":4804,"inference_mode":3250},{"name":2367,"provider":248,"score":4804,"inference_mode":2654},{"name":762,"provider":9,"score":3191,"inference_mode":2654},{"name":884,"provider":138,"score":3273,"inference_mode":3250},{"slug":5527,"field":5528,"name":5529,"description":5530,"categories":5531,"model_count":880,"source":5274,"top_models":5532},"darkbench","benchmark_darkbench","DarkBench","DarkBench — benchmark testing model safety and resistance to adversarial attacks.",[5124],[5533,5534,5535,5536],{"name":1496,"provider":3823,"score":3951,"inference_mode":2654},{"name":684,"provider":3086,"score":3100,"inference_mode":2654},{"name":1196,"provider":1833,"score":3610,"inference_mode":3250},{"name":1196,"provider":1833,"score":3610,"inference_mode":2654},{"slug":5538,"field":5539,"name":5540,"description":5541,"categories":5542,"model_count":880,"source":5274,"top_models":5543},"wmt","benchmark_wmt","WMT 2014","Workshop on Machine Translation 2014 — multilingual translation quality benchmark.",[5443],[5544,5545,5546,5547],{"name":853,"provider":248,"score":3228,"inference_mode":2654},{"name":309,"provider":2706,"score":2767,"inference_mode":2654},{"name":1063,"provider":2706,"score":3474,"inference_mode":2654},{"name":1128,"provider":9,"score":3541,"inference_mode":2654},{"slug":5549,"field":5550,"name":5551,"description":5552,"categories":5553,"model_count":448,"source":5274,"top_models":5554},"gaia","benchmark_gaia","GAIA","GAIA — General AI Assistants benchmark testing multi-step real-world tasks.",[5187],[5555,5556,5557,5558],{"name":1673,"provider":9,"score":4180,"inference_mode":2654},{"name":884,"provider":138,"score":3262,"inference_mode":3250},{"name":884,"provider":138,"score":3262,"inference_mode":2654},{"name":1403,"provider":248,"score":2765,"inference_mode":2654},{"slug":5560,"field":5561,"name":5562,"description":5563,"categories":5564,"model_count":78,"source":5274,"top_models":5565},"multichallenge","benchmark_multichallenge","MultiChallenge","MultiChallenge — general knowledge benchmark with diverse challenge types.",[5224],[5566,5567],{"name":1732,"provider":2665,"score":4260,"inference_mode":2654},{"name":594,"provider":595,"score":3000,"inference_mode":2654},{"benchmark_accountingaudit":5274,"benchmark_agieval_zh":5274,"benchmark_agieval_en":5274,"benchmark_aime":5126,"benchmark_aime_25":5126,"benchmark_arc_challenge":5274,"benchmark_arc_easy":5274,"benchmark_bbeh":5274,"benchmark_bbh":5274,"benchmark_bfcl_v3":5274,"benchmark_bird_critic":5274,"benchmark_darkbench":5274,"benchmark_formal_logic_exp":5274,"benchmark_gaia":5274,"benchmark_gpqa":5126,"benchmark_gsm8k":5274,"benchmark_humaneval":5274,"benchmark_hle":5126,"benchmark_ifbench":5126,"benchmark_ifeval":5274,"benchmark_knights_and_knaves":5274,"benchmark_lcr":5126,"benchmark_livecodebench":5126,"benchmark_math_hard":5126,"benchmark_math":5274,"benchmark_mbppplus":5274,"benchmark_medqa":5274,"benchmark_mmlu":5274,"benchmark_mmlu_pro":5126,"benchmark_mmmu":5274,"benchmark_multichallenge":5274,"benchmark_scicode":5126,"benchmark_simpleqa":5274,"benchmark_stock_bcs":5274,"benchmark_swe_bench_lite":5274,"benchmark_tau2":5126,"benchmark_terminalbench":5126,"benchmark_wmdp":5274,"benchmark_wmt":5274},[5570,5578,5592,5606,5622,5639,5656,5673,5690,5707,5724,5741,5758,5775,5792,5809,5826,5843,5860,5877,5894,5911,5928,5945,5962,5979,5996],{"month":14,"open":5571,"closed":5572},{},{"benchmark_aider":5573,"context_length":5574,"benchmark_mmlu_pro":5575,"benchmark_gpqa":5576,"benchmark_math_hard":5577},{"value":18,"model":8,"provider":9},{"value":24,"model":22,"provider":9},{"value":27,"model":22,"provider":9},{"value":28,"model":22,"provider":9},{"value":30,"model":22,"provider":9},{"month":114,"open":5579,"closed":5586},{"benchmark_mmlu_pro":5580,"benchmark_gpqa":5581,"benchmark_livecodebench":5582,"benchmark_math_hard":5583,"benchmark_aime":5584,"context_length":5585},{"value":118,"model":111,"provider":2665},{"value":119,"model":111,"provider":2665},{"value":2668,"model":111,"provider":2665},{"value":121,"model":111,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":115,"model":111,"provider":2665},{"benchmark_aider":5587,"context_length":5588,"benchmark_mmlu_pro":5589,"benchmark_gpqa":5590,"benchmark_math_hard":5591},{"value":18,"model":8,"provider":9},{"value":24,"model":22,"provider":9},{"value":27,"model":22,"provider":9},{"value":28,"model":22,"provider":9},{"value":30,"model":22,"provider":9},{"month":128,"open":5593,"closed":5600},{"benchmark_mmlu_pro":5594,"benchmark_gpqa":5595,"benchmark_livecodebench":5596,"benchmark_math_hard":5597,"benchmark_aime":5598,"context_length":5599},{"value":130,"model":125,"provider":2665},{"value":2674,"model":125,"provider":2665},{"value":132,"model":125,"provider":2665},{"value":133,"model":125,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":129,"model":125,"provider":2665},{"benchmark_aider":5601,"context_length":5602,"benchmark_mmlu_pro":5603,"benchmark_gpqa":5604,"benchmark_math_hard":5605},{"value":18,"model":8,"provider":9},{"value":24,"model":22,"provider":9},{"value":27,"model":22,"provider":9},{"value":28,"model":22,"provider":9},{"value":30,"model":22,"provider":9},{"month":141,"open":5607,"closed":5614},{"benchmark_mmlu_pro":5608,"benchmark_gpqa":5609,"benchmark_livecodebench":5610,"benchmark_math_hard":5611,"benchmark_aime":5612,"context_length":5613},{"value":130,"model":125,"provider":2665},{"value":2674,"model":125,"provider":2665},{"value":132,"model":125,"provider":2665},{"value":133,"model":125,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":129,"model":125,"provider":2665},{"benchmark_aider":5615,"context_length":5616,"benchmark_mmlu_pro":5617,"benchmark_gpqa":5618,"benchmark_math_hard":5619,"benchmark_livecodebench":5620,"benchmark_aime":5621},{"value":18,"model":8,"provider":9},{"value":142,"model":137,"provider":138},{"value":27,"model":22,"provider":9},{"value":145,"model":137,"provider":138},{"value":30,"model":22,"provider":9},{"value":147,"model":137,"provider":138},{"value":61,"model":137,"provider":138},{"month":155,"open":5623,"closed":5631},{"benchmark_mmlu_pro":5624,"benchmark_gpqa":5625,"benchmark_livecodebench":5626,"benchmark_math_hard":5627,"benchmark_aime":5628,"context_length":5629,"benchmark_aider":5630},{"value":197,"model":190,"provider":2706},{"value":198,"model":190,"provider":2706},{"value":200,"model":190,"provider":2706},{"value":2701,"model":178,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":129,"model":125,"provider":2665},{"value":199,"model":190,"provider":2706},{"benchmark_aider":5632,"context_length":5633,"benchmark_mmlu_pro":5634,"benchmark_gpqa":5635,"benchmark_math_hard":5636,"benchmark_livecodebench":5637,"benchmark_aime":5638},{"value":18,"model":8,"provider":9},{"value":142,"model":137,"provider":138},{"value":2693,"model":152,"provider":9},{"value":145,"model":137,"provider":138},{"value":160,"model":152,"provider":9},{"value":2692,"model":152,"provider":9},{"value":161,"model":152,"provider":9},{"month":219,"open":5640,"closed":5648},{"benchmark_mmlu_pro":5641,"benchmark_gpqa":5642,"benchmark_livecodebench":5643,"benchmark_math_hard":5644,"benchmark_aime":5645,"context_length":5646,"benchmark_aider":5647},{"value":197,"model":190,"provider":2706},{"value":198,"model":190,"provider":2706},{"value":200,"model":190,"provider":2706},{"value":2701,"model":178,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":129,"model":125,"provider":2665},{"value":199,"model":190,"provider":2706},{"benchmark_aider":5649,"context_length":5650,"benchmark_mmlu_pro":5651,"benchmark_gpqa":5652,"benchmark_math_hard":5653,"benchmark_livecodebench":5654,"benchmark_aime":5655},{"value":221,"model":216,"provider":9},{"value":142,"model":137,"provider":138},{"value":2693,"model":152,"provider":9},{"value":2730,"model":216,"provider":9},{"value":721,"model":216,"provider":9},{"value":2096,"model":216,"provider":9},{"value":161,"model":152,"provider":9},{"month":261,"open":5657,"closed":5665},{"benchmark_mmlu_pro":5658,"benchmark_gpqa":5659,"benchmark_livecodebench":5660,"benchmark_math_hard":5661,"benchmark_aime":5662,"context_length":5663,"benchmark_aider":5664},{"value":313,"model":309,"provider":2706},{"value":130,"model":309,"provider":2706},{"value":315,"model":309,"provider":2706},{"value":316,"model":309,"provider":2706},{"value":317,"model":309,"provider":2706},{"value":287,"model":321,"provider":2706},{"value":314,"model":309,"provider":2706},{"benchmark_aider":5666,"context_length":5667,"benchmark_mmlu_pro":5668,"benchmark_gpqa":5669,"benchmark_math_hard":5670,"benchmark_livecodebench":5671,"benchmark_aime":5672},{"value":221,"model":216,"provider":9},{"value":142,"model":137,"provider":138},{"value":2693,"model":152,"provider":9},{"value":2730,"model":216,"provider":9},{"value":721,"model":216,"provider":9},{"value":2096,"model":216,"provider":9},{"value":161,"model":152,"provider":9},{"month":337,"open":5674,"closed":5682},{"benchmark_mmlu_pro":5675,"benchmark_gpqa":5676,"benchmark_livecodebench":5677,"benchmark_math_hard":5678,"benchmark_aime":5679,"context_length":5680,"benchmark_aider":5681},{"value":313,"model":309,"provider":2706},{"value":130,"model":309,"provider":2706},{"value":315,"model":309,"provider":2706},{"value":316,"model":309,"provider":2706},{"value":317,"model":309,"provider":2706},{"value":287,"model":321,"provider":2706},{"value":314,"model":309,"provider":2706},{"benchmark_aider":5683,"context_length":5684,"benchmark_mmlu_pro":5685,"benchmark_gpqa":5686,"benchmark_math_hard":5687,"benchmark_livecodebench":5688,"benchmark_aime":5689},{"value":221,"model":216,"provider":9},{"value":142,"model":137,"provider":138},{"value":2693,"model":152,"provider":9},{"value":2730,"model":216,"provider":9},{"value":721,"model":216,"provider":9},{"value":2096,"model":216,"provider":9},{"value":161,"model":152,"provider":9},{"month":403,"open":5691,"closed":5699},{"benchmark_mmlu_pro":5692,"benchmark_gpqa":5693,"benchmark_livecodebench":5694,"benchmark_math_hard":5695,"benchmark_aime":5696,"context_length":5697,"benchmark_aider":5698},{"value":313,"model":309,"provider":2706},{"value":130,"model":309,"provider":2706},{"value":315,"model":309,"provider":2706},{"value":416,"model":408,"provider":1833},{"value":317,"model":309,"provider":2706},{"value":287,"model":321,"provider":2706},{"value":314,"model":309,"provider":2706},{"benchmark_aider":5700,"context_length":5701,"benchmark_mmlu_pro":5702,"benchmark_gpqa":5703,"benchmark_math_hard":5704,"benchmark_livecodebench":5705,"benchmark_aime":5706},{"value":221,"model":216,"provider":9},{"value":142,"model":137,"provider":138},{"value":2693,"model":152,"provider":9},{"value":2730,"model":216,"provider":9},{"value":721,"model":216,"provider":9},{"value":2096,"model":216,"provider":9},{"value":161,"model":152,"provider":9},{"month":470,"open":5708,"closed":5716},{"benchmark_mmlu_pro":5709,"benchmark_gpqa":5710,"benchmark_livecodebench":5711,"benchmark_math_hard":5712,"benchmark_aime":5713,"context_length":5714,"benchmark_aider":5715},{"value":313,"model":309,"provider":2706},{"value":130,"model":309,"provider":2706},{"value":315,"model":309,"provider":2706},{"value":416,"model":408,"provider":1833},{"value":317,"model":309,"provider":2706},{"value":287,"model":321,"provider":2706},{"value":314,"model":309,"provider":2706},{"benchmark_aider":5717,"context_length":5718,"benchmark_mmlu_pro":5719,"benchmark_gpqa":5720,"benchmark_math_hard":5721,"benchmark_livecodebench":5722,"benchmark_aime":5723},{"value":513,"model":509,"provider":138},{"value":142,"model":137,"provider":138},{"value":511,"model":509,"provider":138},{"value":512,"model":509,"provider":138},{"value":721,"model":216,"provider":9},{"value":514,"model":509,"provider":138},{"value":488,"model":479,"provider":2892},{"month":523,"open":5725,"closed":5733},{"benchmark_mmlu_pro":5726,"benchmark_gpqa":5727,"benchmark_livecodebench":5728,"benchmark_math_hard":5729,"benchmark_aime":5730,"context_length":5731,"benchmark_aider":5732},{"value":313,"model":309,"provider":2706},{"value":130,"model":309,"provider":2706},{"value":315,"model":309,"provider":2706},{"value":416,"model":408,"provider":1833},{"value":317,"model":309,"provider":2706},{"value":287,"model":321,"provider":2706},{"value":555,"model":549,"provider":1833},{"benchmark_aider":5734,"context_length":5735,"benchmark_mmlu_pro":5736,"benchmark_gpqa":5737,"benchmark_math_hard":5738,"benchmark_livecodebench":5739,"benchmark_aime":5740},{"value":513,"model":509,"provider":138},{"value":142,"model":137,"provider":138},{"value":511,"model":509,"provider":138},{"value":512,"model":509,"provider":138},{"value":721,"model":216,"provider":9},{"value":514,"model":509,"provider":138},{"value":488,"model":479,"provider":2892},{"month":598,"open":5742,"closed":5750},{"benchmark_mmlu_pro":5743,"benchmark_gpqa":5744,"benchmark_livecodebench":5745,"benchmark_math_hard":5746,"benchmark_aime":5747,"context_length":5748,"benchmark_aider":5749},{"value":313,"model":309,"provider":2706},{"value":130,"model":309,"provider":2706},{"value":315,"model":309,"provider":2706},{"value":416,"model":408,"provider":1833},{"value":16,"model":630,"provider":2706},{"value":670,"model":666,"provider":667},{"value":555,"model":549,"provider":1833},{"benchmark_aider":5751,"context_length":5752,"benchmark_mmlu_pro":5753,"benchmark_gpqa":5754,"benchmark_math_hard":5755,"benchmark_livecodebench":5756,"benchmark_aime":5757},{"value":513,"model":509,"provider":138},{"value":599,"model":594,"provider":595},{"value":652,"model":649,"provider":9},{"value":653,"model":649,"provider":9},{"value":655,"model":649,"provider":9},{"value":654,"model":649,"provider":9},{"value":656,"model":649,"provider":9},{"month":680,"open":5759,"closed":5767},{"benchmark_mmlu_pro":5760,"benchmark_gpqa":5761,"benchmark_livecodebench":5762,"benchmark_math_hard":5763,"benchmark_aime":5764,"context_length":5765,"benchmark_aider":5766},{"value":721,"model":717,"provider":3115},{"value":3091,"model":684,"provider":3086},{"value":315,"model":309,"provider":2706},{"value":724,"model":717,"provider":3115},{"value":725,"model":717,"provider":3115},{"value":670,"model":666,"provider":667},{"value":555,"model":549,"provider":1833},{"benchmark_aider":5768,"context_length":5769,"benchmark_mmlu_pro":5770,"benchmark_gpqa":5771,"benchmark_math_hard":5772,"benchmark_livecodebench":5773,"benchmark_aime":5774},{"value":513,"model":509,"provider":138},{"value":599,"model":594,"provider":595},{"value":3119,"model":704,"provider":3115},{"value":767,"model":762,"provider":9},{"value":770,"model":762,"provider":9},{"value":769,"model":762,"provider":9},{"value":771,"model":762,"provider":9},{"month":778,"open":5776,"closed":5784},{"benchmark_mmlu_pro":5777,"benchmark_gpqa":5778,"benchmark_livecodebench":5779,"benchmark_math_hard":5780,"benchmark_aime":5781,"context_length":5782,"benchmark_aider":5783},{"value":721,"model":717,"provider":3115},{"value":3091,"model":684,"provider":3086},{"value":315,"model":309,"provider":2706},{"value":724,"model":717,"provider":3115},{"value":725,"model":717,"provider":3115},{"value":670,"model":666,"provider":667},{"value":555,"model":549,"provider":1833},{"benchmark_aider":5785,"context_length":5786,"benchmark_mmlu_pro":5787,"benchmark_gpqa":5788,"benchmark_math_hard":5789,"benchmark_livecodebench":5790,"benchmark_aime":5791},{"value":513,"model":509,"provider":138},{"value":856,"model":853,"provider":248},{"value":3119,"model":704,"provider":3115},{"value":638,"model":865,"provider":9},{"value":870,"model":865,"provider":9},{"value":869,"model":865,"provider":9},{"value":871,"model":865,"provider":9},{"month":913,"open":5793,"closed":5801},{"benchmark_mmlu_pro":5794,"benchmark_gpqa":5795,"benchmark_livecodebench":5796,"benchmark_math_hard":5797,"benchmark_aime":5798,"context_length":5799,"benchmark_aider":5800},{"value":3365,"model":1036,"provider":3115},{"value":1342,"model":1036,"provider":3115},{"value":3302,"model":910,"provider":1833},{"value":943,"model":910,"provider":1833},{"value":1943,"model":910,"provider":1833},{"value":981,"model":978,"provider":385},{"value":555,"model":549,"provider":1833},{"benchmark_aider":5802,"context_length":5803,"benchmark_mmlu_pro":5804,"benchmark_gpqa":5805,"benchmark_math_hard":5806,"benchmark_livecodebench":5807,"benchmark_aime":5808},{"value":513,"model":509,"provider":138},{"value":856,"model":853,"provider":248},{"value":3119,"model":704,"provider":3115},{"value":638,"model":865,"provider":9},{"value":870,"model":865,"provider":9},{"value":869,"model":865,"provider":9},{"value":871,"model":865,"provider":9},{"month":1057,"open":5810,"closed":5818},{"benchmark_mmlu_pro":5811,"benchmark_gpqa":5812,"benchmark_livecodebench":5813,"benchmark_math_hard":5814,"benchmark_aime":5815,"context_length":5816,"benchmark_aider":5817},{"value":1187,"model":1179,"provider":1833},{"value":1188,"model":1179,"provider":1833},{"value":1897,"model":1264,"provider":1833},{"value":1207,"model":1196,"provider":1833},{"value":1190,"model":1179,"provider":1833},{"value":856,"model":1063,"provider":2706},{"value":555,"model":549,"provider":1833},{"benchmark_aider":5819,"context_length":5820,"benchmark_mmlu_pro":5821,"benchmark_gpqa":5822,"benchmark_math_hard":5823,"benchmark_livecodebench":5824,"benchmark_aime":5825},{"value":513,"model":509,"provider":138},{"value":856,"model":853,"provider":248},{"value":994,"model":1162,"provider":9},{"value":3561,"model":1162,"provider":9},{"value":1168,"model":1162,"provider":9},{"value":1156,"model":1150,"provider":9},{"value":1158,"model":1150,"provider":9},{"month":1287,"open":5827,"closed":5835},{"benchmark_mmlu_pro":5828,"benchmark_gpqa":5829,"benchmark_livecodebench":5830,"benchmark_math_hard":5831,"benchmark_aime":5832,"context_length":5833,"benchmark_aider":5834},{"value":1187,"model":1179,"provider":1833},{"value":1188,"model":1179,"provider":1833},{"value":1897,"model":1264,"provider":1833},{"value":1207,"model":1196,"provider":1833},{"value":1190,"model":1179,"provider":1833},{"value":856,"model":1063,"provider":2706},{"value":555,"model":549,"provider":1833},{"benchmark_aider":5836,"context_length":5837,"benchmark_mmlu_pro":5838,"benchmark_gpqa":5839,"benchmark_math_hard":5840,"benchmark_livecodebench":5841,"benchmark_aime":5842},{"value":513,"model":509,"provider":138},{"value":856,"model":853,"provider":248},{"value":905,"model":1348,"provider":138},{"value":3561,"model":1162,"provider":9},{"value":1168,"model":1162,"provider":9},{"value":1156,"model":1150,"provider":9},{"value":1158,"model":1150,"provider":9},{"month":1374,"open":5844,"closed":5852},{"benchmark_mmlu_pro":5845,"benchmark_gpqa":5846,"benchmark_livecodebench":5847,"benchmark_math_hard":5848,"benchmark_aime":5849,"context_length":5850,"benchmark_aider":5851},{"value":1187,"model":1179,"provider":1833},{"value":3927,"model":1447,"provider":1448},{"value":1108,"model":1424,"provider":3889},{"value":1429,"model":1424,"provider":3889},{"value":1190,"model":1179,"provider":1833},{"value":856,"model":1063,"provider":2706},{"value":555,"model":549,"provider":1833},{"benchmark_aider":5853,"context_length":5854,"benchmark_mmlu_pro":5855,"benchmark_gpqa":5856,"benchmark_math_hard":5857,"benchmark_livecodebench":5858,"benchmark_aime":5859},{"value":1366,"model":1395,"provider":9},{"value":856,"model":853,"provider":248},{"value":905,"model":1348,"provider":138},{"value":1399,"model":1395,"provider":9},{"value":1168,"model":1162,"provider":9},{"value":1156,"model":1150,"provider":9},{"value":1158,"model":1150,"provider":9},{"month":1469,"open":5861,"closed":5869},{"benchmark_mmlu_pro":5862,"benchmark_gpqa":5863,"benchmark_livecodebench":5864,"benchmark_math_hard":5865,"benchmark_aime":5866,"context_length":5867,"benchmark_aider":5868},{"value":1112,"model":1521,"provider":3988},{"value":1677,"model":1521,"provider":3988},{"value":994,"model":1521,"provider":3988},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":856,"model":1063,"provider":2706},{"value":555,"model":549,"provider":1833},{"benchmark_aider":5870,"context_length":5871,"benchmark_mmlu_pro":5872,"benchmark_gpqa":5873,"benchmark_math_hard":5874,"benchmark_livecodebench":5875,"benchmark_aime":5876},{"value":1366,"model":1395,"provider":9},{"value":856,"model":853,"provider":248},{"value":905,"model":1348,"provider":138},{"value":1500,"model":1496,"provider":3823},{"value":1168,"model":1162,"provider":9},{"value":1156,"model":1150,"provider":9},{"value":1502,"model":1496,"provider":3823},{"month":1635,"open":5878,"closed":5886},{"benchmark_mmlu_pro":5879,"benchmark_gpqa":5880,"benchmark_livecodebench":5881,"benchmark_math_hard":5882,"benchmark_aime":5883,"context_length":5884,"benchmark_aider":5885},{"value":1744,"model":1739,"provider":3115},{"value":1677,"model":1521,"provider":3988},{"value":4135,"model":1656,"provider":9},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":856,"model":1063,"provider":2706},{"value":555,"model":549,"provider":1833},{"benchmark_aider":5887,"context_length":5888,"benchmark_mmlu_pro":5889,"benchmark_gpqa":5890,"benchmark_math_hard":5891,"benchmark_livecodebench":5892,"benchmark_aime":5893},{"value":1643,"model":1681,"provider":9},{"value":856,"model":853,"provider":248},{"value":1643,"model":1640,"provider":138},{"value":1500,"model":1496,"provider":3823},{"value":4193,"model":1681,"provider":9},{"value":1156,"model":1150,"provider":9},{"value":943,"model":1681,"provider":9},{"month":1785,"open":5895,"closed":5903},{"benchmark_mmlu_pro":5896,"benchmark_gpqa":5897,"benchmark_livecodebench":5898,"benchmark_math_hard":5899,"benchmark_aime":5900,"context_length":5901,"benchmark_aider":5902},{"value":1744,"model":1739,"provider":3115},{"value":1677,"model":1521,"provider":3988},{"value":4135,"model":1656,"provider":9},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":856,"model":1063,"provider":2706},{"value":1793,"model":1916,"provider":3115},{"benchmark_aider":5904,"context_length":5905,"benchmark_mmlu_pro":5906,"benchmark_gpqa":5907,"benchmark_math_hard":5908,"benchmark_livecodebench":5909,"benchmark_aime":5910},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":1643,"model":1640,"provider":138},{"value":1500,"model":1496,"provider":3823},{"value":4193,"model":1681,"provider":9},{"value":1156,"model":1150,"provider":9},{"value":943,"model":1681,"provider":9},{"month":1951,"open":5912,"closed":5920},{"benchmark_mmlu_pro":5913,"benchmark_gpqa":5914,"benchmark_livecodebench":5915,"benchmark_math_hard":5916,"benchmark_aime":5917,"context_length":5918,"benchmark_aider":5919},{"value":1744,"model":1739,"provider":3115},{"value":1677,"model":1521,"provider":3988},{"value":4135,"model":1656,"provider":9},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":856,"model":1063,"provider":2706},{"value":1793,"model":1916,"provider":3115},{"benchmark_aider":5921,"context_length":5922,"benchmark_mmlu_pro":5923,"benchmark_gpqa":5924,"benchmark_math_hard":5925,"benchmark_livecodebench":5926,"benchmark_aime":5927},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":1643,"model":1640,"provider":138},{"value":1500,"model":1496,"provider":3823},{"value":4193,"model":1681,"provider":9},{"value":1156,"model":1150,"provider":9},{"value":943,"model":1681,"provider":9},{"month":2105,"open":5929,"closed":5937},{"benchmark_mmlu_pro":5930,"benchmark_gpqa":5931,"benchmark_livecodebench":5932,"benchmark_math_hard":5933,"benchmark_aime":5934,"context_length":5935,"benchmark_aider":5936},{"value":1744,"model":1739,"provider":3115},{"value":1677,"model":1521,"provider":3988},{"value":4135,"model":1656,"provider":9},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":856,"model":1063,"provider":2706},{"value":1793,"model":1916,"provider":3115},{"benchmark_aider":5938,"context_length":5939,"benchmark_mmlu_pro":5940,"benchmark_gpqa":5941,"benchmark_math_hard":5942,"benchmark_livecodebench":5943,"benchmark_aime":5944},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":2154,"model":2151,"provider":248},{"value":2155,"model":2151,"provider":248},{"value":4193,"model":1681,"provider":9},{"value":2156,"model":2151,"provider":248},{"value":943,"model":1681,"provider":9},{"month":2214,"open":5946,"closed":5954},{"benchmark_mmlu_pro":5947,"benchmark_gpqa":5948,"benchmark_livecodebench":5949,"benchmark_math_hard":5950,"benchmark_aime":5951,"context_length":5952,"benchmark_aider":5953},{"value":1930,"model":2389,"provider":3889},{"value":1221,"model":2220,"provider":3115},{"value":4691,"model":2220,"provider":3115},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":856,"model":1063,"provider":2706},{"value":1793,"model":1916,"provider":3115},{"benchmark_aider":5955,"context_length":5956,"benchmark_mmlu_pro":5957,"benchmark_gpqa":5958,"benchmark_math_hard":5959,"benchmark_livecodebench":5960,"benchmark_aime":5961},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":2154,"model":2151,"provider":248},{"value":2155,"model":2151,"provider":248},{"value":4193,"model":1681,"provider":9},{"value":2156,"model":2151,"provider":248},{"value":943,"model":1681,"provider":9},{"month":2413,"open":5963,"closed":5971},{"benchmark_mmlu_pro":5964,"benchmark_gpqa":5965,"benchmark_livecodebench":5966,"benchmark_math_hard":5967,"benchmark_aime":5968,"context_length":5969,"benchmark_aider":5970},{"value":1930,"model":2389,"provider":3889},{"value":2460,"model":2455,"provider":3988},{"value":4691,"model":2220,"provider":3115},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":856,"model":1063,"provider":2706},{"value":1793,"model":1916,"provider":3115},{"benchmark_aider":5972,"context_length":5973,"benchmark_mmlu_pro":5974,"benchmark_gpqa":5975,"benchmark_math_hard":5976,"benchmark_livecodebench":5977,"benchmark_aime":5978},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":2154,"model":2151,"provider":248},{"value":2155,"model":2151,"provider":248},{"value":4193,"model":1681,"provider":9},{"value":2156,"model":2151,"provider":248},{"value":943,"model":1681,"provider":9},{"month":2476,"open":5980,"closed":5988},{"benchmark_mmlu_pro":5981,"benchmark_gpqa":5982,"benchmark_livecodebench":5983,"benchmark_math_hard":5984,"benchmark_aime":5985,"context_length":5986,"benchmark_aider":5987},{"value":1930,"model":2389,"provider":3889},{"value":973,"model":2508,"provider":1833},{"value":4691,"model":2220,"provider":3115},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":856,"model":1063,"provider":2706},{"value":1793,"model":1916,"provider":3115},{"benchmark_aider":5989,"context_length":5990,"benchmark_mmlu_pro":5991,"benchmark_gpqa":5992,"benchmark_math_hard":5993,"benchmark_livecodebench":5994,"benchmark_aime":5995},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":2154,"model":2151,"provider":248},{"value":2542,"model":2539,"provider":9},{"value":4193,"model":1681,"provider":9},{"value":2156,"model":2151,"provider":248},{"value":943,"model":1681,"provider":9},{"month":2592,"open":5997,"closed":6005},{"benchmark_mmlu_pro":5998,"benchmark_gpqa":5999,"benchmark_livecodebench":6000,"benchmark_math_hard":6001,"benchmark_aime":6002,"context_length":6003,"benchmark_aider":6004},{"value":1930,"model":2389,"provider":3889},{"value":973,"model":2508,"provider":1833},{"value":4691,"model":2220,"provider":3115},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":856,"model":1063,"provider":2706},{"value":1793,"model":1916,"provider":3115},{"benchmark_aider":6006,"context_length":6007,"benchmark_mmlu_pro":6008,"benchmark_gpqa":6009,"benchmark_math_hard":6010,"benchmark_livecodebench":6011,"benchmark_aime":6012},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":2154,"model":2151,"provider":248},{"value":2216,"model":2608,"provider":9},{"value":4193,"model":1681,"provider":9},{"value":2156,"model":2151,"provider":248},{"value":943,"model":1681,"provider":9},{"months":6014,"countries":6766},[6015,6022,6036,6050,6066,6082,6098,6114,6130,6154,6178,6203,6228,6253,6278,6311,6344,6377,6410,6443,6483,6523,6563,6603,6643,6683,6723],{"month":14,"us":6016},{"benchmark_aider":6017,"context_length":6018,"benchmark_mmlu_pro":6019,"benchmark_gpqa":6020,"benchmark_math_hard":6021},{"value":18,"model":8,"provider":9},{"value":24,"model":22,"provider":9},{"value":27,"model":22,"provider":9},{"value":28,"model":22,"provider":9},{"value":30,"model":22,"provider":9},{"month":114,"us":6023,"fr":6029},{"benchmark_aider":6024,"context_length":6025,"benchmark_mmlu_pro":6026,"benchmark_gpqa":6027,"benchmark_math_hard":6028},{"value":18,"model":8,"provider":9},{"value":24,"model":22,"provider":9},{"value":27,"model":22,"provider":9},{"value":28,"model":22,"provider":9},{"value":30,"model":22,"provider":9},{"benchmark_mmlu_pro":6030,"benchmark_gpqa":6031,"benchmark_livecodebench":6032,"benchmark_math_hard":6033,"benchmark_aime":6034,"context_length":6035},{"value":118,"model":111,"provider":2665},{"value":119,"model":111,"provider":2665},{"value":2668,"model":111,"provider":2665},{"value":121,"model":111,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":115,"model":111,"provider":2665},{"month":128,"us":6037,"fr":6043},{"benchmark_aider":6038,"context_length":6039,"benchmark_mmlu_pro":6040,"benchmark_gpqa":6041,"benchmark_math_hard":6042},{"value":18,"model":8,"provider":9},{"value":24,"model":22,"provider":9},{"value":27,"model":22,"provider":9},{"value":28,"model":22,"provider":9},{"value":30,"model":22,"provider":9},{"benchmark_mmlu_pro":6044,"benchmark_gpqa":6045,"benchmark_livecodebench":6046,"benchmark_math_hard":6047,"benchmark_aime":6048,"context_length":6049},{"value":130,"model":125,"provider":2665},{"value":2674,"model":125,"provider":2665},{"value":132,"model":125,"provider":2665},{"value":133,"model":125,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":129,"model":125,"provider":2665},{"month":141,"us":6051,"fr":6059},{"benchmark_aider":6052,"context_length":6053,"benchmark_mmlu_pro":6054,"benchmark_gpqa":6055,"benchmark_math_hard":6056,"benchmark_livecodebench":6057,"benchmark_aime":6058},{"value":18,"model":8,"provider":9},{"value":142,"model":137,"provider":138},{"value":27,"model":22,"provider":9},{"value":145,"model":137,"provider":138},{"value":30,"model":22,"provider":9},{"value":147,"model":137,"provider":138},{"value":61,"model":137,"provider":138},{"benchmark_mmlu_pro":6060,"benchmark_gpqa":6061,"benchmark_livecodebench":6062,"benchmark_math_hard":6063,"benchmark_aime":6064,"context_length":6065},{"value":130,"model":125,"provider":2665},{"value":2674,"model":125,"provider":2665},{"value":132,"model":125,"provider":2665},{"value":133,"model":125,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":129,"model":125,"provider":2665},{"month":155,"us":6067,"fr":6075},{"benchmark_aider":6068,"context_length":6069,"benchmark_mmlu_pro":6070,"benchmark_gpqa":6071,"benchmark_math_hard":6072,"benchmark_livecodebench":6073,"benchmark_aime":6074},{"value":18,"model":8,"provider":9},{"value":142,"model":137,"provider":138},{"value":2693,"model":152,"provider":9},{"value":198,"model":190,"provider":2706},{"value":160,"model":152,"provider":9},{"value":2692,"model":152,"provider":9},{"value":161,"model":152,"provider":9},{"benchmark_mmlu_pro":6076,"benchmark_gpqa":6077,"benchmark_livecodebench":6078,"benchmark_math_hard":6079,"benchmark_aime":6080,"context_length":6081},{"value":183,"model":178,"provider":2665},{"value":2674,"model":125,"provider":2665},{"value":132,"model":125,"provider":2665},{"value":2701,"model":178,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":129,"model":125,"provider":2665},{"month":219,"us":6083,"fr":6091},{"benchmark_aider":6084,"context_length":6085,"benchmark_mmlu_pro":6086,"benchmark_gpqa":6087,"benchmark_math_hard":6088,"benchmark_livecodebench":6089,"benchmark_aime":6090},{"value":221,"model":216,"provider":9},{"value":142,"model":137,"provider":138},{"value":2693,"model":152,"provider":9},{"value":2730,"model":216,"provider":9},{"value":721,"model":216,"provider":9},{"value":2096,"model":216,"provider":9},{"value":161,"model":152,"provider":9},{"benchmark_mmlu_pro":6092,"benchmark_gpqa":6093,"benchmark_livecodebench":6094,"benchmark_math_hard":6095,"benchmark_aime":6096,"context_length":6097},{"value":183,"model":178,"provider":2665},{"value":2674,"model":125,"provider":2665},{"value":132,"model":125,"provider":2665},{"value":2701,"model":178,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":129,"model":125,"provider":2665},{"month":261,"us":6099,"fr":6107},{"benchmark_aider":6100,"context_length":6101,"benchmark_mmlu_pro":6102,"benchmark_gpqa":6103,"benchmark_math_hard":6104,"benchmark_livecodebench":6105,"benchmark_aime":6106},{"value":221,"model":216,"provider":9},{"value":142,"model":137,"provider":138},{"value":313,"model":309,"provider":2706},{"value":2730,"model":216,"provider":9},{"value":721,"model":216,"provider":9},{"value":2096,"model":216,"provider":9},{"value":317,"model":309,"provider":2706},{"benchmark_mmlu_pro":6108,"benchmark_gpqa":6109,"benchmark_livecodebench":6110,"benchmark_math_hard":6111,"benchmark_aime":6112,"context_length":6113},{"value":183,"model":178,"provider":2665},{"value":2674,"model":125,"provider":2665},{"value":132,"model":125,"provider":2665},{"value":2701,"model":178,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":129,"model":125,"provider":2665},{"month":337,"us":6115,"fr":6123},{"benchmark_aider":6116,"context_length":6117,"benchmark_mmlu_pro":6118,"benchmark_gpqa":6119,"benchmark_math_hard":6120,"benchmark_livecodebench":6121,"benchmark_aime":6122},{"value":221,"model":216,"provider":9},{"value":142,"model":137,"provider":138},{"value":313,"model":309,"provider":2706},{"value":2730,"model":216,"provider":9},{"value":721,"model":216,"provider":9},{"value":2096,"model":216,"provider":9},{"value":317,"model":309,"provider":2706},{"benchmark_mmlu_pro":6124,"benchmark_gpqa":6125,"benchmark_livecodebench":6126,"benchmark_math_hard":6127,"benchmark_aime":6128,"context_length":6129},{"value":183,"model":178,"provider":2665},{"value":2674,"model":125,"provider":2665},{"value":132,"model":125,"provider":2665},{"value":2701,"model":178,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":129,"model":125,"provider":2665},{"month":403,"us":6131,"fr":6139,"cn":6146},{"benchmark_aider":6132,"context_length":6133,"benchmark_mmlu_pro":6134,"benchmark_gpqa":6135,"benchmark_math_hard":6136,"benchmark_livecodebench":6137,"benchmark_aime":6138},{"value":221,"model":216,"provider":9},{"value":142,"model":137,"provider":138},{"value":313,"model":309,"provider":2706},{"value":2730,"model":216,"provider":9},{"value":721,"model":216,"provider":9},{"value":2096,"model":216,"provider":9},{"value":317,"model":309,"provider":2706},{"benchmark_mmlu_pro":6140,"benchmark_gpqa":6141,"benchmark_livecodebench":6142,"benchmark_math_hard":6143,"benchmark_aime":6144,"context_length":6145},{"value":183,"model":178,"provider":2665},{"value":2674,"model":125,"provider":2665},{"value":132,"model":125,"provider":2665},{"value":2701,"model":178,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":129,"model":125,"provider":2665},{"benchmark_mmlu_pro":6147,"benchmark_gpqa":6148,"benchmark_aider":6149,"benchmark_livecodebench":6150,"benchmark_math_hard":6151,"benchmark_aime":6152,"context_length":6153},{"value":412,"model":408,"provider":1833},{"value":413,"model":408,"provider":1833},{"value":414,"model":408,"provider":1833},{"value":415,"model":408,"provider":1833},{"value":416,"model":408,"provider":1833},{"value":417,"model":408,"provider":1833},{"value":115,"model":408,"provider":1833},{"month":470,"us":6155,"fr":6163,"cn":6170},{"benchmark_aider":6156,"context_length":6157,"benchmark_mmlu_pro":6158,"benchmark_gpqa":6159,"benchmark_math_hard":6160,"benchmark_livecodebench":6161,"benchmark_aime":6162},{"value":513,"model":509,"provider":138},{"value":142,"model":137,"provider":138},{"value":511,"model":509,"provider":138},{"value":512,"model":509,"provider":138},{"value":721,"model":216,"provider":9},{"value":514,"model":509,"provider":138},{"value":488,"model":479,"provider":2892},{"benchmark_mmlu_pro":6164,"benchmark_gpqa":6165,"benchmark_livecodebench":6166,"benchmark_math_hard":6167,"benchmark_aime":6168,"context_length":6169},{"value":183,"model":178,"provider":2665},{"value":2674,"model":125,"provider":2665},{"value":132,"model":125,"provider":2665},{"value":2701,"model":178,"provider":2665},{"value":2667,"model":111,"provider":2665},{"value":129,"model":125,"provider":2665},{"benchmark_mmlu_pro":6171,"benchmark_gpqa":6172,"benchmark_aider":6173,"benchmark_livecodebench":6174,"benchmark_math_hard":6175,"benchmark_aime":6176,"context_length":6177},{"value":412,"model":408,"provider":1833},{"value":413,"model":408,"provider":1833},{"value":414,"model":408,"provider":1833},{"value":415,"model":408,"provider":1833},{"value":416,"model":408,"provider":1833},{"value":417,"model":408,"provider":1833},{"value":115,"model":408,"provider":1833},{"month":523,"us":6179,"fr":6187,"cn":6195},{"benchmark_aider":6180,"context_length":6181,"benchmark_mmlu_pro":6182,"benchmark_gpqa":6183,"benchmark_math_hard":6184,"benchmark_livecodebench":6185,"benchmark_aime":6186},{"value":513,"model":509,"provider":138},{"value":142,"model":137,"provider":138},{"value":511,"model":509,"provider":138},{"value":512,"model":509,"provider":138},{"value":721,"model":216,"provider":9},{"value":514,"model":509,"provider":138},{"value":488,"model":479,"provider":2892},{"benchmark_mmlu_pro":6188,"benchmark_gpqa":6189,"benchmark_livecodebench":6190,"benchmark_math_hard":6191,"benchmark_aime":6192,"context_length":6193,"benchmark_aider":6194},{"value":566,"model":562,"provider":2665},{"value":567,"model":562,"provider":2665},{"value":2973,"model":584,"provider":2665},{"value":590,"model":584,"provider":2665},{"value":448,"model":584,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6196,"benchmark_gpqa":6197,"benchmark_aider":6198,"benchmark_livecodebench":6199,"benchmark_math_hard":6200,"benchmark_aime":6201,"context_length":6202},{"value":412,"model":408,"provider":1833},{"value":413,"model":408,"provider":1833},{"value":555,"model":549,"provider":1833},{"value":556,"model":549,"provider":1833},{"value":416,"model":408,"provider":1833},{"value":417,"model":408,"provider":1833},{"value":115,"model":408,"provider":1833},{"month":598,"us":6204,"fr":6212,"cn":6220},{"benchmark_aider":6205,"context_length":6206,"benchmark_mmlu_pro":6207,"benchmark_gpqa":6208,"benchmark_math_hard":6209,"benchmark_livecodebench":6210,"benchmark_aime":6211},{"value":513,"model":509,"provider":138},{"value":599,"model":594,"provider":595},{"value":652,"model":649,"provider":9},{"value":653,"model":649,"provider":9},{"value":655,"model":649,"provider":9},{"value":654,"model":649,"provider":9},{"value":656,"model":649,"provider":9},{"benchmark_mmlu_pro":6213,"benchmark_gpqa":6214,"benchmark_livecodebench":6215,"benchmark_math_hard":6216,"benchmark_aime":6217,"context_length":6218,"benchmark_aider":6219},{"value":566,"model":562,"provider":2665},{"value":567,"model":562,"provider":2665},{"value":2973,"model":584,"provider":2665},{"value":590,"model":584,"provider":2665},{"value":448,"model":584,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6221,"benchmark_gpqa":6222,"benchmark_aider":6223,"benchmark_livecodebench":6224,"benchmark_math_hard":6225,"benchmark_aime":6226,"context_length":6227},{"value":412,"model":408,"provider":1833},{"value":413,"model":408,"provider":1833},{"value":555,"model":549,"provider":1833},{"value":556,"model":549,"provider":1833},{"value":416,"model":408,"provider":1833},{"value":417,"model":408,"provider":1833},{"value":670,"model":666,"provider":667},{"month":680,"us":6229,"fr":6237,"cn":6245},{"benchmark_aider":6230,"context_length":6231,"benchmark_mmlu_pro":6232,"benchmark_gpqa":6233,"benchmark_math_hard":6234,"benchmark_livecodebench":6235,"benchmark_aime":6236},{"value":513,"model":509,"provider":138},{"value":599,"model":594,"provider":595},{"value":652,"model":649,"provider":9},{"value":767,"model":762,"provider":9},{"value":770,"model":762,"provider":9},{"value":769,"model":762,"provider":9},{"value":771,"model":762,"provider":9},{"benchmark_mmlu_pro":6238,"benchmark_gpqa":6239,"benchmark_livecodebench":6240,"benchmark_math_hard":6241,"benchmark_aime":6242,"context_length":6243,"benchmark_aider":6244},{"value":566,"model":562,"provider":2665},{"value":567,"model":562,"provider":2665},{"value":2973,"model":584,"provider":2665},{"value":590,"model":584,"provider":2665},{"value":448,"model":584,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6246,"benchmark_gpqa":6247,"benchmark_aider":6248,"benchmark_livecodebench":6249,"benchmark_math_hard":6250,"benchmark_aime":6251,"context_length":6252},{"value":3119,"model":704,"provider":3115},{"value":710,"model":704,"provider":3115},{"value":555,"model":549,"provider":1833},{"value":712,"model":704,"provider":3115},{"value":713,"model":704,"provider":3115},{"value":749,"model":741,"provider":3115},{"value":670,"model":666,"provider":667},{"month":778,"us":6254,"fr":6262,"cn":6270},{"benchmark_aider":6255,"context_length":6256,"benchmark_mmlu_pro":6257,"benchmark_gpqa":6258,"benchmark_math_hard":6259,"benchmark_livecodebench":6260,"benchmark_aime":6261},{"value":513,"model":509,"provider":138},{"value":856,"model":853,"provider":248},{"value":652,"model":649,"provider":9},{"value":638,"model":865,"provider":9},{"value":870,"model":865,"provider":9},{"value":869,"model":865,"provider":9},{"value":871,"model":865,"provider":9},{"benchmark_mmlu_pro":6263,"benchmark_gpqa":6264,"benchmark_livecodebench":6265,"benchmark_math_hard":6266,"benchmark_aime":6267,"context_length":6268,"benchmark_aider":6269},{"value":566,"model":562,"provider":2665},{"value":567,"model":562,"provider":2665},{"value":2973,"model":584,"provider":2665},{"value":590,"model":584,"provider":2665},{"value":880,"model":875,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6271,"benchmark_gpqa":6272,"benchmark_aider":6273,"benchmark_livecodebench":6274,"benchmark_math_hard":6275,"benchmark_aime":6276,"context_length":6277},{"value":3119,"model":704,"provider":3115},{"value":710,"model":704,"provider":3115},{"value":555,"model":549,"provider":1833},{"value":712,"model":704,"provider":3115},{"value":713,"model":704,"provider":3115},{"value":749,"model":741,"provider":3115},{"value":670,"model":666,"provider":667},{"month":913,"us":6279,"fr":6287,"cn":6295,"ca":6303},{"benchmark_aider":6280,"context_length":6281,"benchmark_mmlu_pro":6282,"benchmark_gpqa":6283,"benchmark_math_hard":6284,"benchmark_livecodebench":6285,"benchmark_aime":6286},{"value":513,"model":509,"provider":138},{"value":856,"model":853,"provider":248},{"value":652,"model":649,"provider":9},{"value":638,"model":865,"provider":9},{"value":870,"model":865,"provider":9},{"value":869,"model":865,"provider":9},{"value":871,"model":865,"provider":9},{"benchmark_mmlu_pro":6288,"benchmark_gpqa":6289,"benchmark_livecodebench":6290,"benchmark_math_hard":6291,"benchmark_aime":6292,"context_length":6293,"benchmark_aider":6294},{"value":566,"model":562,"provider":2665},{"value":567,"model":562,"provider":2665},{"value":2973,"model":584,"provider":2665},{"value":590,"model":584,"provider":2665},{"value":880,"model":875,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6296,"benchmark_gpqa":6297,"benchmark_aider":6298,"benchmark_livecodebench":6299,"benchmark_math_hard":6300,"benchmark_aime":6301,"context_length":6302},{"value":3119,"model":704,"provider":3115},{"value":710,"model":704,"provider":3115},{"value":555,"model":549,"provider":1833},{"value":3302,"model":910,"provider":1833},{"value":713,"model":704,"provider":3115},{"value":1943,"model":910,"provider":1833},{"value":670,"model":666,"provider":667},{"benchmark_mmlu_pro":6304,"benchmark_gpqa":6305,"benchmark_aider":6306,"benchmark_livecodebench":6307,"benchmark_math_hard":6308,"benchmark_aime":6309,"context_length":6310},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"month":1057,"us":6312,"fr":6320,"cn":6328,"ca":6336},{"benchmark_aider":6313,"context_length":6314,"benchmark_mmlu_pro":6315,"benchmark_gpqa":6316,"benchmark_math_hard":6317,"benchmark_livecodebench":6318,"benchmark_aime":6319},{"value":513,"model":509,"provider":138},{"value":856,"model":853,"provider":248},{"value":994,"model":1162,"provider":9},{"value":3561,"model":1162,"provider":9},{"value":1168,"model":1162,"provider":9},{"value":1156,"model":1150,"provider":9},{"value":1158,"model":1150,"provider":9},{"benchmark_mmlu_pro":6321,"benchmark_gpqa":6322,"benchmark_livecodebench":6323,"benchmark_math_hard":6324,"benchmark_aime":6325,"context_length":6326,"benchmark_aider":6327},{"value":566,"model":562,"provider":2665},{"value":567,"model":562,"provider":2665},{"value":2973,"model":584,"provider":2665},{"value":590,"model":584,"provider":2665},{"value":880,"model":875,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6329,"benchmark_gpqa":6330,"benchmark_aider":6331,"benchmark_livecodebench":6332,"benchmark_math_hard":6333,"benchmark_aime":6334,"context_length":6335},{"value":3119,"model":704,"provider":3115},{"value":710,"model":704,"provider":3115},{"value":555,"model":549,"provider":1833},{"value":1897,"model":1264,"provider":1833},{"value":713,"model":704,"provider":3115},{"value":1190,"model":1179,"provider":1833},{"value":670,"model":666,"provider":667},{"benchmark_mmlu_pro":6337,"benchmark_gpqa":6338,"benchmark_aider":6339,"benchmark_livecodebench":6340,"benchmark_math_hard":6341,"benchmark_aime":6342,"context_length":6343},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"month":1287,"us":6345,"fr":6353,"cn":6361,"ca":6369},{"benchmark_aider":6346,"context_length":6347,"benchmark_mmlu_pro":6348,"benchmark_gpqa":6349,"benchmark_math_hard":6350,"benchmark_livecodebench":6351,"benchmark_aime":6352},{"value":513,"model":509,"provider":138},{"value":856,"model":853,"provider":248},{"value":905,"model":1348,"provider":138},{"value":3561,"model":1162,"provider":9},{"value":1168,"model":1162,"provider":9},{"value":1156,"model":1150,"provider":9},{"value":1158,"model":1150,"provider":9},{"benchmark_mmlu_pro":6354,"benchmark_gpqa":6355,"benchmark_livecodebench":6356,"benchmark_math_hard":6357,"benchmark_aime":6358,"context_length":6359,"benchmark_aider":6360},{"value":1322,"model":1319,"provider":2665},{"value":933,"model":1319,"provider":2665},{"value":1201,"model":1319,"provider":2665},{"value":1323,"model":1319,"provider":2665},{"value":1324,"model":1319,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6362,"benchmark_gpqa":6363,"benchmark_aider":6364,"benchmark_livecodebench":6365,"benchmark_math_hard":6366,"benchmark_aime":6367,"context_length":6368},{"value":3804,"model":1361,"provider":3115},{"value":1166,"model":1361,"provider":3115},{"value":555,"model":549,"provider":1833},{"value":771,"model":1361,"provider":3115},{"value":1367,"model":1361,"provider":3115},{"value":973,"model":1361,"provider":3115},{"value":670,"model":666,"provider":667},{"benchmark_mmlu_pro":6370,"benchmark_gpqa":6371,"benchmark_aider":6372,"benchmark_livecodebench":6373,"benchmark_math_hard":6374,"benchmark_aime":6375,"context_length":6376},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"month":1374,"us":6378,"fr":6386,"cn":6394,"ca":6402},{"benchmark_aider":6379,"context_length":6380,"benchmark_mmlu_pro":6381,"benchmark_gpqa":6382,"benchmark_math_hard":6383,"benchmark_livecodebench":6384,"benchmark_aime":6385},{"value":1366,"model":1395,"provider":9},{"value":856,"model":853,"provider":248},{"value":905,"model":1348,"provider":138},{"value":1399,"model":1395,"provider":9},{"value":1168,"model":1162,"provider":9},{"value":1156,"model":1150,"provider":9},{"value":1158,"model":1150,"provider":9},{"benchmark_mmlu_pro":6387,"benchmark_gpqa":6388,"benchmark_livecodebench":6389,"benchmark_math_hard":6390,"benchmark_aime":6391,"context_length":6392,"benchmark_aider":6393},{"value":1322,"model":1319,"provider":2665},{"value":933,"model":1319,"provider":2665},{"value":1201,"model":1319,"provider":2665},{"value":1323,"model":1319,"provider":2665},{"value":1324,"model":1319,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6395,"benchmark_gpqa":6396,"benchmark_aider":6397,"benchmark_livecodebench":6398,"benchmark_math_hard":6399,"benchmark_aime":6400,"context_length":6401},{"value":3804,"model":1361,"provider":3115},{"value":1166,"model":1361,"provider":3115},{"value":555,"model":549,"provider":1833},{"value":771,"model":1361,"provider":3115},{"value":1367,"model":1361,"provider":3115},{"value":973,"model":1361,"provider":3115},{"value":792,"model":1424,"provider":3889},{"benchmark_mmlu_pro":6403,"benchmark_gpqa":6404,"benchmark_aider":6405,"benchmark_livecodebench":6406,"benchmark_math_hard":6407,"benchmark_aime":6408,"context_length":6409},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"month":1469,"us":6411,"fr":6419,"cn":6427,"ca":6435},{"benchmark_aider":6412,"context_length":6413,"benchmark_mmlu_pro":6414,"benchmark_gpqa":6415,"benchmark_math_hard":6416,"benchmark_livecodebench":6417,"benchmark_aime":6418},{"value":1366,"model":1395,"provider":9},{"value":856,"model":853,"provider":248},{"value":905,"model":1348,"provider":138},{"value":1500,"model":1496,"provider":3823},{"value":1168,"model":1162,"provider":9},{"value":1156,"model":1150,"provider":9},{"value":1502,"model":1496,"provider":3823},{"benchmark_mmlu_pro":6420,"benchmark_gpqa":6421,"benchmark_livecodebench":6422,"benchmark_math_hard":6423,"benchmark_aime":6424,"context_length":6425,"benchmark_aider":6426},{"value":1322,"model":1319,"provider":2665},{"value":933,"model":1319,"provider":2665},{"value":1201,"model":1319,"provider":2665},{"value":1323,"model":1319,"provider":2665},{"value":1324,"model":1319,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6428,"benchmark_gpqa":6429,"benchmark_aider":6430,"benchmark_livecodebench":6431,"benchmark_math_hard":6432,"benchmark_aime":6433,"context_length":6434},{"value":3804,"model":1361,"provider":3115},{"value":1677,"model":1521,"provider":3988},{"value":555,"model":549,"provider":1833},{"value":994,"model":1521,"provider":3988},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":792,"model":1424,"provider":3889},{"benchmark_mmlu_pro":6436,"benchmark_gpqa":6437,"benchmark_aider":6438,"benchmark_livecodebench":6439,"benchmark_math_hard":6440,"benchmark_aime":6441,"context_length":6442},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"month":1635,"us":6444,"fr":6452,"cn":6460,"ca":6468,"il":6476},{"benchmark_aider":6445,"context_length":6446,"benchmark_mmlu_pro":6447,"benchmark_gpqa":6448,"benchmark_math_hard":6449,"benchmark_livecodebench":6450,"benchmark_aime":6451},{"value":1643,"model":1681,"provider":9},{"value":856,"model":853,"provider":248},{"value":1643,"model":1640,"provider":138},{"value":1500,"model":1496,"provider":3823},{"value":4193,"model":1681,"provider":9},{"value":4135,"model":1656,"provider":9},{"value":943,"model":1681,"provider":9},{"benchmark_mmlu_pro":6453,"benchmark_gpqa":6454,"benchmark_livecodebench":6455,"benchmark_math_hard":6456,"benchmark_aime":6457,"context_length":6458,"benchmark_aider":6459},{"value":1322,"model":1319,"provider":2665},{"value":1735,"model":1732,"provider":2665},{"value":1239,"model":1732,"provider":2665},{"value":1323,"model":1319,"provider":2665},{"value":1324,"model":1319,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6461,"benchmark_gpqa":6462,"benchmark_aider":6463,"benchmark_livecodebench":6464,"benchmark_math_hard":6465,"benchmark_aime":6466,"context_length":6467},{"value":1744,"model":1739,"provider":3115},{"value":1677,"model":1521,"provider":3988},{"value":555,"model":549,"provider":1833},{"value":994,"model":1521,"provider":3988},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":792,"model":1424,"provider":3889},{"benchmark_mmlu_pro":6469,"benchmark_gpqa":6470,"benchmark_aider":6471,"benchmark_livecodebench":6472,"benchmark_math_hard":6473,"benchmark_aime":6474,"context_length":6475},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"benchmark_mmlu_pro":6477,"benchmark_gpqa":6478,"benchmark_livecodebench":6479,"benchmark_math_hard":6480,"benchmark_aime":6481,"context_length":6482},{"value":4232,"model":1696,"provider":4226},{"value":1071,"model":1696,"provider":4226},{"value":3702,"model":1696,"provider":4226},{"value":17,"model":1696,"provider":4226},{"value":230,"model":1696,"provider":4226},{"value":981,"model":1696,"provider":4226},{"month":1785,"us":6484,"fr":6492,"cn":6500,"ca":6508,"il":6516},{"benchmark_aider":6485,"context_length":6486,"benchmark_mmlu_pro":6487,"benchmark_gpqa":6488,"benchmark_math_hard":6489,"benchmark_livecodebench":6490,"benchmark_aime":6491},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":1643,"model":1640,"provider":138},{"value":1500,"model":1496,"provider":3823},{"value":4193,"model":1681,"provider":9},{"value":4135,"model":1656,"provider":9},{"value":943,"model":1681,"provider":9},{"benchmark_mmlu_pro":6493,"benchmark_gpqa":6494,"benchmark_livecodebench":6495,"benchmark_math_hard":6496,"benchmark_aime":6497,"context_length":6498,"benchmark_aider":6499},{"value":1322,"model":1319,"provider":2665},{"value":1735,"model":1732,"provider":2665},{"value":1239,"model":1732,"provider":2665},{"value":1323,"model":1319,"provider":2665},{"value":1324,"model":1319,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6501,"benchmark_gpqa":6502,"benchmark_aider":6503,"benchmark_livecodebench":6504,"benchmark_math_hard":6505,"benchmark_aime":6506,"context_length":6507},{"value":1744,"model":1739,"provider":3115},{"value":1677,"model":1521,"provider":3988},{"value":1793,"model":1916,"provider":3115},{"value":994,"model":1521,"provider":3988},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":792,"model":1424,"provider":3889},{"benchmark_mmlu_pro":6509,"benchmark_gpqa":6510,"benchmark_aider":6511,"benchmark_livecodebench":6512,"benchmark_math_hard":6513,"benchmark_aime":6514,"context_length":6515},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"benchmark_mmlu_pro":6517,"benchmark_gpqa":6518,"benchmark_livecodebench":6519,"benchmark_math_hard":6520,"benchmark_aime":6521,"context_length":6522},{"value":4232,"model":1696,"provider":4226},{"value":1071,"model":1696,"provider":4226},{"value":3702,"model":1696,"provider":4226},{"value":17,"model":1696,"provider":4226},{"value":230,"model":1696,"provider":4226},{"value":981,"model":1696,"provider":4226},{"month":1951,"us":6524,"fr":6532,"cn":6540,"ca":6548,"il":6556},{"benchmark_aider":6525,"context_length":6526,"benchmark_mmlu_pro":6527,"benchmark_gpqa":6528,"benchmark_math_hard":6529,"benchmark_livecodebench":6530,"benchmark_aime":6531},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":1643,"model":1640,"provider":138},{"value":1500,"model":1496,"provider":3823},{"value":4193,"model":1681,"provider":9},{"value":4135,"model":1656,"provider":9},{"value":943,"model":1681,"provider":9},{"benchmark_mmlu_pro":6533,"benchmark_gpqa":6534,"benchmark_livecodebench":6535,"benchmark_math_hard":6536,"benchmark_aime":6537,"context_length":6538,"benchmark_aider":6539},{"value":1322,"model":1319,"provider":2665},{"value":1735,"model":1732,"provider":2665},{"value":1239,"model":1732,"provider":2665},{"value":1323,"model":1319,"provider":2665},{"value":1324,"model":1319,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6541,"benchmark_gpqa":6542,"benchmark_aider":6543,"benchmark_livecodebench":6544,"benchmark_math_hard":6545,"benchmark_aime":6546,"context_length":6547},{"value":1744,"model":1739,"provider":3115},{"value":1677,"model":1521,"provider":3988},{"value":1793,"model":1916,"provider":3115},{"value":994,"model":1521,"provider":3988},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":792,"model":1424,"provider":3889},{"benchmark_mmlu_pro":6549,"benchmark_gpqa":6550,"benchmark_aider":6551,"benchmark_livecodebench":6552,"benchmark_math_hard":6553,"benchmark_aime":6554,"context_length":6555},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"benchmark_mmlu_pro":6557,"benchmark_gpqa":6558,"benchmark_livecodebench":6559,"benchmark_math_hard":6560,"benchmark_aime":6561,"context_length":6562},{"value":4232,"model":1696,"provider":4226},{"value":1071,"model":1696,"provider":4226},{"value":3702,"model":1696,"provider":4226},{"value":17,"model":1696,"provider":4226},{"value":230,"model":1696,"provider":4226},{"value":981,"model":1696,"provider":4226},{"month":2105,"us":6564,"fr":6572,"cn":6580,"ca":6588,"il":6596},{"benchmark_aider":6565,"context_length":6566,"benchmark_mmlu_pro":6567,"benchmark_gpqa":6568,"benchmark_math_hard":6569,"benchmark_livecodebench":6570,"benchmark_aime":6571},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":2154,"model":2151,"provider":248},{"value":2155,"model":2151,"provider":248},{"value":4193,"model":1681,"provider":9},{"value":2156,"model":2151,"provider":248},{"value":943,"model":1681,"provider":9},{"benchmark_mmlu_pro":6573,"benchmark_gpqa":6574,"benchmark_livecodebench":6575,"benchmark_math_hard":6576,"benchmark_aime":6577,"context_length":6578,"benchmark_aider":6579},{"value":1322,"model":1319,"provider":2665},{"value":1735,"model":1732,"provider":2665},{"value":1239,"model":1732,"provider":2665},{"value":1323,"model":1319,"provider":2665},{"value":1324,"model":1319,"provider":2665},{"value":287,"model":562,"provider":2665},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6581,"benchmark_gpqa":6582,"benchmark_aider":6583,"benchmark_livecodebench":6584,"benchmark_math_hard":6585,"benchmark_aime":6586,"context_length":6587},{"value":1744,"model":1739,"provider":3115},{"value":1677,"model":1521,"provider":3988},{"value":1793,"model":1916,"provider":3115},{"value":994,"model":1521,"provider":3988},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":792,"model":1424,"provider":3889},{"benchmark_mmlu_pro":6589,"benchmark_gpqa":6590,"benchmark_aider":6591,"benchmark_livecodebench":6592,"benchmark_math_hard":6593,"benchmark_aime":6594,"context_length":6595},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"benchmark_mmlu_pro":6597,"benchmark_gpqa":6598,"benchmark_livecodebench":6599,"benchmark_math_hard":6600,"benchmark_aime":6601,"context_length":6602},{"value":4232,"model":1696,"provider":4226},{"value":1071,"model":1696,"provider":4226},{"value":3702,"model":1696,"provider":4226},{"value":17,"model":1696,"provider":4226},{"value":230,"model":1696,"provider":4226},{"value":981,"model":1696,"provider":4226},{"month":2214,"us":6604,"fr":6612,"cn":6620,"ca":6628,"il":6636},{"benchmark_aider":6605,"context_length":6606,"benchmark_mmlu_pro":6607,"benchmark_gpqa":6608,"benchmark_math_hard":6609,"benchmark_livecodebench":6610,"benchmark_aime":6611},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":2154,"model":2151,"provider":248},{"value":2155,"model":2151,"provider":248},{"value":4193,"model":1681,"provider":9},{"value":2156,"model":2151,"provider":248},{"value":943,"model":1681,"provider":9},{"benchmark_mmlu_pro":6613,"benchmark_gpqa":6614,"benchmark_livecodebench":6615,"benchmark_math_hard":6616,"benchmark_aime":6617,"context_length":6618,"benchmark_aider":6619},{"value":781,"model":2305,"provider":2665},{"value":636,"model":2305,"provider":2665},{"value":4733,"model":2305,"provider":2665},{"value":1323,"model":1319,"provider":2665},{"value":1324,"model":1319,"provider":2665},{"value":1477,"model":2234,"provider":83},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6621,"benchmark_gpqa":6622,"benchmark_aider":6623,"benchmark_livecodebench":6624,"benchmark_math_hard":6625,"benchmark_aime":6626,"context_length":6627},{"value":1930,"model":2389,"provider":3889},{"value":1221,"model":2220,"provider":3115},{"value":1793,"model":1916,"provider":3115},{"value":4691,"model":2220,"provider":3115},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":792,"model":1424,"provider":3889},{"benchmark_mmlu_pro":6629,"benchmark_gpqa":6630,"benchmark_aider":6631,"benchmark_livecodebench":6632,"benchmark_math_hard":6633,"benchmark_aime":6634,"context_length":6635},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"benchmark_mmlu_pro":6637,"benchmark_gpqa":6638,"benchmark_livecodebench":6639,"benchmark_math_hard":6640,"benchmark_aime":6641,"context_length":6642},{"value":4232,"model":1696,"provider":4226},{"value":1071,"model":1696,"provider":4226},{"value":3702,"model":1696,"provider":4226},{"value":17,"model":1696,"provider":4226},{"value":230,"model":1696,"provider":4226},{"value":981,"model":1696,"provider":4226},{"month":2413,"us":6644,"fr":6652,"cn":6660,"ca":6668,"il":6676},{"benchmark_aider":6645,"context_length":6646,"benchmark_mmlu_pro":6647,"benchmark_gpqa":6648,"benchmark_math_hard":6649,"benchmark_livecodebench":6650,"benchmark_aime":6651},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":2154,"model":2151,"provider":248},{"value":2155,"model":2151,"provider":248},{"value":4193,"model":1681,"provider":9},{"value":2156,"model":2151,"provider":248},{"value":943,"model":1681,"provider":9},{"benchmark_mmlu_pro":6653,"benchmark_gpqa":6654,"benchmark_livecodebench":6655,"benchmark_math_hard":6656,"benchmark_aime":6657,"context_length":6658,"benchmark_aider":6659},{"value":781,"model":2305,"provider":2665},{"value":636,"model":2305,"provider":2665},{"value":4733,"model":2305,"provider":2665},{"value":1323,"model":1319,"provider":2665},{"value":1324,"model":1319,"provider":2665},{"value":1477,"model":2234,"provider":83},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6661,"benchmark_gpqa":6662,"benchmark_aider":6663,"benchmark_livecodebench":6664,"benchmark_math_hard":6665,"benchmark_aime":6666,"context_length":6667},{"value":1930,"model":2389,"provider":3889},{"value":2460,"model":2455,"provider":3988},{"value":1793,"model":1916,"provider":3115},{"value":4691,"model":2220,"provider":3115},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":792,"model":1424,"provider":3889},{"benchmark_mmlu_pro":6669,"benchmark_gpqa":6670,"benchmark_aider":6671,"benchmark_livecodebench":6672,"benchmark_math_hard":6673,"benchmark_aime":6674,"context_length":6675},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"benchmark_mmlu_pro":6677,"benchmark_gpqa":6678,"benchmark_livecodebench":6679,"benchmark_math_hard":6680,"benchmark_aime":6681,"context_length":6682},{"value":4232,"model":1696,"provider":4226},{"value":1071,"model":1696,"provider":4226},{"value":3702,"model":1696,"provider":4226},{"value":17,"model":1696,"provider":4226},{"value":230,"model":1696,"provider":4226},{"value":981,"model":1696,"provider":4226},{"month":2476,"us":6684,"fr":6692,"cn":6700,"ca":6708,"il":6716},{"benchmark_aider":6685,"context_length":6686,"benchmark_mmlu_pro":6687,"benchmark_gpqa":6688,"benchmark_math_hard":6689,"benchmark_livecodebench":6690,"benchmark_aime":6691},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":2154,"model":2151,"provider":248},{"value":2542,"model":2539,"provider":9},{"value":4193,"model":1681,"provider":9},{"value":2156,"model":2151,"provider":248},{"value":943,"model":1681,"provider":9},{"benchmark_mmlu_pro":6693,"benchmark_gpqa":6694,"benchmark_livecodebench":6695,"benchmark_math_hard":6696,"benchmark_aime":6697,"context_length":6698,"benchmark_aider":6699},{"value":781,"model":2305,"provider":2665},{"value":636,"model":2305,"provider":2665},{"value":4733,"model":2305,"provider":2665},{"value":1323,"model":1319,"provider":2665},{"value":1324,"model":1319,"provider":2665},{"value":1477,"model":2234,"provider":83},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6701,"benchmark_gpqa":6702,"benchmark_aider":6703,"benchmark_livecodebench":6704,"benchmark_math_hard":6705,"benchmark_aime":6706,"context_length":6707},{"value":1930,"model":2389,"provider":3889},{"value":973,"model":2508,"provider":1833},{"value":1793,"model":1916,"provider":3115},{"value":4691,"model":2220,"provider":3115},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":792,"model":1424,"provider":3889},{"benchmark_mmlu_pro":6709,"benchmark_gpqa":6710,"benchmark_aider":6711,"benchmark_livecodebench":6712,"benchmark_math_hard":6713,"benchmark_aime":6714,"context_length":6715},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"benchmark_mmlu_pro":6717,"benchmark_gpqa":6718,"benchmark_livecodebench":6719,"benchmark_math_hard":6720,"benchmark_aime":6721,"context_length":6722},{"value":4232,"model":1696,"provider":4226},{"value":1071,"model":1696,"provider":4226},{"value":3702,"model":1696,"provider":4226},{"value":17,"model":1696,"provider":4226},{"value":230,"model":1696,"provider":4226},{"value":981,"model":1696,"provider":4226},{"month":2592,"us":6724,"fr":6732,"cn":6740,"ca":6748,"il":6756,"ae":6763},{"benchmark_aider":6725,"context_length":6726,"benchmark_mmlu_pro":6727,"benchmark_gpqa":6728,"benchmark_math_hard":6729,"benchmark_livecodebench":6730,"benchmark_aime":6731},{"value":1643,"model":1681,"provider":9},{"value":1842,"model":1839,"provider":3823},{"value":2154,"model":2151,"provider":248},{"value":2216,"model":2608,"provider":9},{"value":4193,"model":1681,"provider":9},{"value":2156,"model":2151,"provider":248},{"value":943,"model":1681,"provider":9},{"benchmark_mmlu_pro":6733,"benchmark_gpqa":6734,"benchmark_livecodebench":6735,"benchmark_math_hard":6736,"benchmark_aime":6737,"context_length":6738,"benchmark_aider":6739},{"value":781,"model":2305,"provider":2665},{"value":636,"model":2305,"provider":2665},{"value":4733,"model":2305,"provider":2665},{"value":1323,"model":1319,"provider":2665},{"value":1324,"model":1319,"provider":2665},{"value":1477,"model":2234,"provider":83},{"value":414,"model":584,"provider":2665},{"benchmark_mmlu_pro":6741,"benchmark_gpqa":6742,"benchmark_aider":6743,"benchmark_livecodebench":6744,"benchmark_math_hard":6745,"benchmark_aime":6746,"context_length":6747},{"value":1930,"model":2389,"provider":3889},{"value":973,"model":2508,"provider":1833},{"value":1793,"model":1916,"provider":3115},{"value":4691,"model":2220,"provider":3115},{"value":1590,"model":1586,"provider":1833},{"value":1158,"model":1586,"provider":1833},{"value":792,"model":1424,"provider":3889},{"benchmark_mmlu_pro":6749,"benchmark_gpqa":6750,"benchmark_aider":6751,"benchmark_livecodebench":6752,"benchmark_math_hard":6753,"benchmark_aime":6754,"context_length":6755},{"value":982,"model":978,"provider":385},{"value":133,"model":978,"provider":385},{"value":558,"model":978,"provider":385},{"value":983,"model":978,"provider":385},{"value":3365,"model":978,"provider":385},{"value":3014,"model":978,"provider":385},{"value":981,"model":978,"provider":385},{"benchmark_mmlu_pro":6757,"benchmark_gpqa":6758,"benchmark_livecodebench":6759,"benchmark_math_hard":6760,"benchmark_aime":6761,"context_length":6762},{"value":4232,"model":1696,"provider":4226},{"value":1071,"model":1696,"provider":4226},{"value":3702,"model":1696,"provider":4226},{"value":17,"model":1696,"provider":4226},{"value":230,"model":1696,"provider":4226},{"value":981,"model":1696,"provider":4226},{"benchmark_gpqa":6764,"context_length":6765},{"value":771,"model":2602,"provider":1277},{"value":129,"model":2602,"provider":1277},[6767,6769,6771,6773,6775,6777],{"code":2653,"label":6768},"United States",{"code":2666,"label":6770},"France",{"code":2817,"label":6772},"China",{"code":3362,"label":6774},"Canada",{"code":4228,"label":6776},"Israel",{"code":5063,"label":6778},"UAE",297,260,{"earliest":14,"latest":2592},1775268368908]