@@ -313,16 +313,21 @@ files in the context."
313
313
current))
314
314
(plist-get (car (last prompts)) :parts ))))
315
315
316
+ (defconst gptel--gemini-cost-url " https://ai.google.dev/pricing"
317
+ " Web page for current Gemini model pricing." )
318
+
316
319
(defconst gptel--gemini-models
317
- ' ((gemini-1.5-pro-latest
320
+ ` ((gemini-1.5-pro-latest
318
321
:description " Google's latest model with enhanced capabilities across various tasks"
319
322
:capabilities (tool-use json media)
320
323
:mime-types (" image/png" " image/jpeg" " image/webp" " image/heic" " image/heif"
321
324
" application/pdf" " text/plain" " text/csv" " text/html" )
322
325
:context-window 2000
326
+ :max-output 8192
323
327
; ; input & output price is halved for prompts of 128k tokens or less
324
328
:input-cost 2.50
325
329
:output-cost 10
330
+ :cost-url , gptel--gemini-cost-url
326
331
:cutoff-date " 2024-05" )
327
332
(gemini-2.0-flash-exp
328
333
:description " Next generation features, superior speed, native tool use"
@@ -337,19 +342,23 @@ files in the context."
337
342
:mime-types (" image/png" " image/jpeg" " image/webp" " image/heic" " image/heif"
338
343
" application/pdf" " text/plain" " text/csv" " text/html" )
339
344
:context-window 1000
345
+ :max-output 8192
340
346
; ; input & output price is halved for prompts of 128k tokens or less
341
347
:input-cost 0.15
342
348
:output-cost 0.60
349
+ :cost-url , gptel--gemini-cost-url
343
350
:cutoff-date " 2024-05" )
344
351
(gemini-1.5-flash-8b
345
352
:description " High volume and lower intelligence tasks"
346
353
:capabilities (tool-use json media)
347
354
:context-window 1000
355
+ :max-output 8192
348
356
:mime-types (" image/png" " image/jpeg" " image/webp" " image/heic" " image/heif"
349
357
" application/pdf" " text/plain" " text/csv" " text/html" )
350
358
; ; input & output price is halved for prompts of 128k tokens or less
351
359
:input-cost 0.075
352
360
:output-cost 0.30
361
+ :cost-url , gptel--gemini-cost-url
353
362
:cutoff-date " 2024-10" )
354
363
(gemini-exp-1206
355
364
:description " Improved coding, reasoning and vision capabilities"
@@ -363,28 +372,33 @@ files in the context."
363
372
:mime-types (" image/png" " image/jpeg" " image/webp" " image/heic" " image/heif"
364
373
" application/pdf" " text/plain" " text/csv" " text/html" )
365
374
:context-window 1000
375
+ :max-output 8192
366
376
:input-cost 0.10
367
377
:output-cost 0.40
378
+ :cost-url , gptel--gemini-cost-url
368
379
:cutoff-date " 2024-08" )
369
380
(gemini-2.0-flash-lite-preview-02-05
370
381
:description " Gemini 2.0 Flash model optimized for cost efficiency and low latency"
371
382
:capabilities (json)
372
383
:context-window 1000
373
384
:input-cost 0.075
374
385
:output-cost 0.30
386
+ :cost-url , gptel--gemini-cost-url
375
387
:cutoff-date " 2024-08" )
376
388
(gemini-2.0-pro-exp-02-05
377
389
:description " Next gen, high speed, multimodal for a diverse variety of tasks"
378
390
:capabilities (tool-use json)
379
391
:context-window 2000
380
392
:input-cost 0.00
381
393
:output-cost 0.00
394
+ :cost-url , gptel--gemini-cost-url
382
395
:cutoff-date " 2024-08" )
383
396
(gemini-2.0-flash-thinking-exp-01-21
384
397
:description " Next gen, high speed, multimodal for a diverse variety of tasks"
385
398
:capabilities (json)
386
399
:input-cost 0.00
387
400
:output-cost 0.00
401
+ :cost-url , gptel--gemini-cost-url
388
402
:cutoff-date " 2024-08" )
389
403
(gemini-2.0-flash-exp
390
404
:description " Multi-modal, streaming, tool use 2000 RPM"
@@ -394,6 +408,7 @@ files in the context."
394
408
:context-window 1000
395
409
:input-cost 0.00
396
410
:output-cost 0.00
411
+ :cost-url , gptel--gemini-cost-url
397
412
:cutoff-date " 2024-08" )
398
413
(gemini-2.0-flash-thinking-exp
399
414
:description " DEPRECATED: Please use gemini-2.0-flash-thinking-exp-01-21 instead."
@@ -413,10 +428,14 @@ Keys:
413
428
414
429
- `:context-window' : the context window size, in thousands of tokens.
415
430
431
+ - `:max-output' : maximum number of output tokens.
432
+
416
433
- `:input-cost' : the input cost, in US dollars per million tokens.
417
434
418
435
- `:output-cost' : the output cost, in US dollars per million tokens.
419
436
437
+ - `:cost-url' : web page for current model pricing.
438
+
420
439
- `:cutoff-date' : the knowledge cutoff date.
421
440
422
441
- `:request-params' : a plist of additional request parameters to
0 commit comments