Skip to content

Commit f3dcf39

Browse files
committed
LLMs: Gemini: update cba
1 parent 06cbef1 commit f3dcf39

File tree

1 file changed

+9
-9
lines changed

1 file changed

+9
-9
lines changed

src/modules/llms/server/gemini/gemini.models.ts

Lines changed: 9 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -163,7 +163,7 @@ const _knownGeminiModels: ({
163163
{ paramId: 'llmVndGeminiCodeExecution' },
164164
{ paramId: 'llmVndGeminiGoogleSearch' },
165165
],
166-
benchmark: { cbaElo: 1501 }, // First model to exceed 1500 Elo on LMArena
166+
benchmark: { cbaElo: 1498 }, // gemini-3-pro (preliminary)
167167
},
168168

169169
// 3.0 Pro Image Preview - Released November 20, 2025
@@ -208,7 +208,7 @@ const _knownGeminiModels: ({
208208
{ paramId: 'llmVndGeminiThinkingBudget', rangeOverride: [128, 32768] /* does not support 0 which would turn thinking off */ },
209209
{ paramId: 'llmVndGeminiGoogleSearch' },
210210
],
211-
benchmark: { cbaElo: 1455 }, // gemini-2.5-pro (updated from CSV)
211+
benchmark: { cbaElo: 1451 }, // gemini-2.5-pro
212212
},
213213
{
214214
hidden: true, // show the final stable version instead
@@ -218,14 +218,14 @@ const _knownGeminiModels: ({
218218
chatPrice: gemini25ProPricing,
219219
interfaces: IF_25,
220220
parameterSpecs: [{ paramId: 'llmVndGeminiThinkingBudget', rangeOverride: [128, 32768] /* does not support 0 which would turn thinking off */ }],
221-
benchmark: { cbaElo: 1467 },
221+
// benchmark: { cbaElo: 1467 }, // commented out, yielding to the final versions
222222
},
223223
{
224224
id: 'models/gemini-2.5-pro-preview-05-06',
225225
isPreview: true,
226226
chatPrice: gemini25ProPricing,
227227
interfaces: IF_25,
228-
benchmark: { cbaElo: 1446 },
228+
// benchmark: { cbaElo: 1446 },
229229
hidden: true, // superseded by 06-05 version
230230
},
231231
{
@@ -234,7 +234,7 @@ const _knownGeminiModels: ({
234234
chatPrice: gemini25ProPricing,
235235
interfaces: IF_25,
236236
// parameterSpecs: [{ paramId: 'llmVndGeminiShowThoughts' }], // Gemini doesn't show thoughts anymore
237-
benchmark: { cbaElo: 1439 },
237+
// benchmark: { cbaElo: 1439 },
238238
hidden: true, // hard-superseded, but keeping this as non-symlink in case Gemini restores it
239239
},
240240

@@ -265,7 +265,7 @@ const _knownGeminiModels: ({
265265
{ paramId: 'llmVndGeminiThinkingBudget' },
266266
{ paramId: 'llmVndGeminiGoogleSearch' },
267267
],
268-
benchmark: { cbaElo: 1424 + 1 }, // FALLBACK-UNTIL-AVAILABLE: models/gemini-2.5-flash-preview-05-20 + 1
268+
benchmark: { cbaElo: 1406 + 2 }, // gemini-2.5-flash-preview-09-2025 - the +2 is to be on top of the non-preview 2.5-flash (1407)
269269
},
270270
{
271271
hidden: true, // yielding to 'models/gemini-2.5-flash-preview-09-2025', which is more recent
@@ -377,7 +377,7 @@ const _knownGeminiModels: ({
377377
{ paramId: 'llmVndGeminiThinkingBudget' },
378378
{ paramId: 'llmVndGeminiGoogleSearch' },
379379
],
380-
benchmark: { cbaElo: 1310 + 1 }, // FALLBACK-UNTIL-AVAILABLE: models/gemini-2.5-flash-lite-preview-06-17 + 1
380+
benchmark: { cbaElo: 1380 }, // gemini-2.5-flash-lite-preview-09-2025 (no-thinking variant)
381381
},
382382
// 2.5 Flash-Lite (Stable) - Released July 2025
383383
{
@@ -497,7 +497,7 @@ const _knownGeminiModels: ({
497497
chatPrice: gemini20FlashPricing,
498498
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_GEM_CodeExecution],
499499
parameterSpecs: [{ paramId: 'llmVndGeminiGoogleSearch' }],
500-
benchmark: { cbaElo: 1355 },
500+
benchmark: { cbaElo: 1360 }, // gemini-2.0-flash-001
501501
},
502502
{
503503
id: 'models/gemini-2.0-flash',
@@ -506,7 +506,7 @@ const _knownGeminiModels: ({
506506
chatPrice: gemini20FlashPricing,
507507
interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json, LLM_IF_GEM_CodeExecution],
508508
parameterSpecs: [{ paramId: 'llmVndGeminiGoogleSearch' }],
509-
benchmark: { cbaElo: 1354 },
509+
benchmark: { cbaElo: 1360 }, // gemini-2.0-flash
510510
},
511511

512512
// 2.0 Flash Lite

0 commit comments

Comments
 (0)