@@ -163,7 +163,7 @@ const _knownGeminiModels: ({
163163 { paramId : 'llmVndGeminiCodeExecution' } ,
164164 { paramId : 'llmVndGeminiGoogleSearch' } ,
165165 ] ,
166- benchmark : { cbaElo : 1501 } , // First model to exceed 1500 Elo on LMArena
166+ benchmark : { cbaElo : 1498 } , // gemini-3-pro (preliminary)
167167 } ,
168168
169169 // 3.0 Pro Image Preview - Released November 20, 2025
@@ -208,7 +208,7 @@ const _knownGeminiModels: ({
208208 { paramId : 'llmVndGeminiThinkingBudget' , rangeOverride : [ 128 , 32768 ] /* does not support 0 which would turn thinking off */ } ,
209209 { paramId : 'llmVndGeminiGoogleSearch' } ,
210210 ] ,
211- benchmark : { cbaElo : 1455 } , // gemini-2.5-pro (updated from CSV)
211+ benchmark : { cbaElo : 1451 } , // gemini-2.5-pro
212212 } ,
213213 {
214214 hidden : true , // show the final stable version instead
@@ -218,14 +218,14 @@ const _knownGeminiModels: ({
218218 chatPrice : gemini25ProPricing ,
219219 interfaces : IF_25 ,
220220 parameterSpecs : [ { paramId : 'llmVndGeminiThinkingBudget' , rangeOverride : [ 128 , 32768 ] /* does not support 0 which would turn thinking off */ } ] ,
221- benchmark : { cbaElo : 1467 } ,
221+ // benchmark: { cbaElo: 1467 }, // commented out, yielding to the final versions
222222 } ,
223223 {
224224 id : 'models/gemini-2.5-pro-preview-05-06' ,
225225 isPreview : true ,
226226 chatPrice : gemini25ProPricing ,
227227 interfaces : IF_25 ,
228- benchmark : { cbaElo : 1446 } ,
228+ // benchmark: { cbaElo: 1446 },
229229 hidden : true , // superseded by 06-05 version
230230 } ,
231231 {
@@ -234,7 +234,7 @@ const _knownGeminiModels: ({
234234 chatPrice : gemini25ProPricing ,
235235 interfaces : IF_25 ,
236236 // parameterSpecs: [{ paramId: 'llmVndGeminiShowThoughts' }], // Gemini doesn't show thoughts anymore
237- benchmark : { cbaElo : 1439 } ,
237+ // benchmark: { cbaElo: 1439 },
238238 hidden : true , // hard-superseded, but keeping this as non-symlink in case Gemini restores it
239239 } ,
240240
@@ -265,7 +265,7 @@ const _knownGeminiModels: ({
265265 { paramId : 'llmVndGeminiThinkingBudget' } ,
266266 { paramId : 'llmVndGeminiGoogleSearch' } ,
267267 ] ,
268- benchmark : { cbaElo : 1424 + 1 } , // FALLBACK-UNTIL-AVAILABLE: models/ gemini-2.5-flash-preview-05-20 + 1
268+ benchmark : { cbaElo : 1406 + 2 } , // gemini-2.5-flash-preview-09-2025 - the +2 is to be on top of the non-preview 2.5-flash (1407)
269269 } ,
270270 {
271271 hidden : true , // yielding to 'models/gemini-2.5-flash-preview-09-2025', which is more recent
@@ -377,7 +377,7 @@ const _knownGeminiModels: ({
377377 { paramId : 'llmVndGeminiThinkingBudget' } ,
378378 { paramId : 'llmVndGeminiGoogleSearch' } ,
379379 ] ,
380- benchmark : { cbaElo : 1310 + 1 } , // FALLBACK-UNTIL-AVAILABLE: models/ gemini-2.5-flash-lite-preview-06-17 + 1
380+ benchmark : { cbaElo : 1380 } , // gemini-2.5-flash-lite-preview-09-2025 (no-thinking variant)
381381 } ,
382382 // 2.5 Flash-Lite (Stable) - Released July 2025
383383 {
@@ -497,7 +497,7 @@ const _knownGeminiModels: ({
497497 chatPrice : gemini20FlashPricing ,
498498 interfaces : [ LLM_IF_OAI_Chat , LLM_IF_OAI_Vision , LLM_IF_OAI_Fn , LLM_IF_OAI_Json , LLM_IF_GEM_CodeExecution ] ,
499499 parameterSpecs : [ { paramId : 'llmVndGeminiGoogleSearch' } ] ,
500- benchmark : { cbaElo : 1355 } ,
500+ benchmark : { cbaElo : 1360 } , // gemini-2.0-flash-001
501501 } ,
502502 {
503503 id : 'models/gemini-2.0-flash' ,
@@ -506,7 +506,7 @@ const _knownGeminiModels: ({
506506 chatPrice : gemini20FlashPricing ,
507507 interfaces : [ LLM_IF_OAI_Chat , LLM_IF_OAI_Vision , LLM_IF_OAI_Fn , LLM_IF_OAI_Json , LLM_IF_GEM_CodeExecution ] ,
508508 parameterSpecs : [ { paramId : 'llmVndGeminiGoogleSearch' } ] ,
509- benchmark : { cbaElo : 1354 } ,
509+ benchmark : { cbaElo : 1360 } , // gemini-2.0-flash
510510 } ,
511511
512512 // 2.0 Flash Lite
0 commit comments