gptel: Add describe-gptel-model feature

pabl0 · pabl0 · commit 9db68bbc77e4 · 2025-03-15T22:59:39.000+02:00
* gptel.el (gptel--openai-cost-url, gptel--openai-models): Add
:cost-url for OpenAI pricing web page.

* gptel.el (describe-gptel-model): New function to display a
description of a gptel model in the *Help* buffer.

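* gptel-anthropic.el (gptel--anthropic-cost-url,
gptel--anthropic-models): Add :cost-url for Claude pricing web page.
Add :max-output for maximum output tokens.

* gptel-gemini.el (gptel--gemini-cost-url, gptel--gemini-models):
Add :cost-url for Gemini pricing web page.  Add :max-output for
maximum output tokens.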

* gptel-openai-extras.el (gptel-make-deepseek): Add
:cost-url and :max-output to the default DeepSeek models.

* gptel-transient.el (gptel-menu): Add a new subsection "Info"
and a new command "Describe model" (bound to `h') to describe
the currently selected model.
diff --git a/gptel-anthropic.el b/gptel-anthropic.el
@@ -468,45 +468,58 @@ files in the context."
 ;;                   (t context-string)))
 ;;         (plist-get (car (last prompts)) :content)))
 
+(defconst gptel--anthropic-cost-url "https://docs.anthropic.com/en/docs/about-claude/models#model-comparison-table"
+  "Web page for current Anthropic model pricing.")
+
 (defconst gptel--anthropic-models
-  '((claude-3-7-sonnet-20250219
+  `((claude-3-7-sonnet-20250219
      :description "Hybrid model capable of standard thinking and extended thinking modes"
      :capabilities (media tool-use cache)
      :mime-types ("image/jpeg" "image/png" "image/gif" "image/webp" "application/pdf")
      :context-window 200
+     :max-output 8192
      :input-cost 3
      :output-cost 15
+     :cost-url ,gptel--anthropic-cost-url
      :cutoff-date "2025-02")
     (claude-3-5-sonnet-20241022
      :description "Highest level of intelligence and capability"
      :capabilities (media tool-use cache)
      :mime-types ("image/jpeg" "image/png" "image/gif" "image/webp" "application/pdf")
      :context-window 200
+     :max-output 8192
      :input-cost 3
      :output-cost 15
+     :cost-url ,gptel--anthropic-cost-url
      :cutoff-date "2024-04")
     (claude-3-5-sonnet-20240620
      :description "Highest level of intelligence and capability (earlier version)"
      :capabilities (media tool-use cache)
      :mime-types ("image/jpeg" "image/png" "image/gif" "image/webp")
      :context-window 200
+     :max-output 8192
      :input-cost 3
      :output-cost 15
+     :cost-url ,gptel--anthropic-cost-url
      :cutoff-date "2024-04")
     (claude-3-5-haiku-20241022
      :description "Intelligence at blazing speeds"
      :capabilities (tool-use cache)
      :context-window 200
+     :max-output 8192
      :input-cost 1.00
      :output-cost 5.00
+     :cost-url ,gptel--anthropic-cost-url
      :cutoff-date "2024-07")
     (claude-3-opus-20240229
      :description "Top-level performance, intelligence, fluency, and understanding"
      :capabilities (media tool-use cache)
      :mime-types ("image/jpeg" "image/png" "image/gif" "image/webp")
      :context-window 200
+     :max-output 4096
      :input-cost 15
      :output-cost 75
+     :cost-url ,gptel--anthropic-cost-url
      :cutoff-date "2023-08")
     (claude-3-sonnet-20240229
      :description "Balance of intelligence and speed (legacy model)"
@@ -515,13 +528,16 @@ files in the context."
      :context-window 200
      :input-cost 3
      :output-cost 15
+     :cost-url ,gptel--anthropic-cost-url
      :cutoff-date "2023-08")
     (claude-3-haiku-20240307
      :description "Fast and most compact model for near-instant responsiveness"
      :capabilities (tool-use cache)
      :context-window 200
+     :max-output 4096
      :input-cost 0.25
      :output-cost 1.25
+     :cost-url ,gptel--anthropic-cost-url
      :cutoff-date "2023-08"))
   "List of available Anthropic models and associated properties.
 Keys:
@@ -534,10 +550,14 @@ Keys:
 
 - `:context-window': the context window size, in thousands of tokens.
 
+- `:max-output': the maximum number of output tokens.
+
 - `:input-cost': the input cost, in US dollars per million tokens.
 
 - `:output-cost': the output cost, in US dollars per million tokens.
 
+- `:cost-url': web page for current model pricing.
+
 - `:cutoff-date': the knowledge cutoff date.
 
 - `:request-params': a plist of additional request parameters to
diff --git a/gptel-gemini.el b/gptel-gemini.el
@@ -313,16 +313,21 @@ files in the context."
                   current))
         (plist-get (car (last prompts)) :parts))))
 
+(defconst gptel--gemini-cost-url "https://ai.google.dev/pricing"
+  "Web page for current Gemini model pricing.")
+
 (defconst gptel--gemini-models
-  '((gemini-1.5-pro-latest
+  `((gemini-1.5-pro-latest
      :description "Google's latest model with enhanced capabilities across various tasks"
      :capabilities (tool-use json media)
      :mime-types ("image/png" "image/jpeg" "image/webp" "image/heic" "image/heif"
                   "application/pdf" "text/plain" "text/csv" "text/html")
      :context-window 2000
+     :max-output 8192
      ;; input & output price is halved for prompts of 128k tokens or less
      :input-cost 2.50
      :output-cost 10
+     :cost-url ,gptel--gemini-cost-url
      :cutoff-date "2024-05")
     (gemini-2.0-flash-exp
      :description "Next generation features, superior speed, native tool use"
@@ -337,19 +342,23 @@ files in the context."
      :mime-types ("image/png" "image/jpeg" "image/webp" "image/heic" "image/heif"
                   "application/pdf" "text/plain" "text/csv" "text/html")
      :context-window 1000
+     :max-output 8192
      ;; input & output price is halved for prompts of 128k tokens or less
      :input-cost 0.15
      :output-cost 0.60
+     :cost-url ,gptel--gemini-cost-url
      :cutoff-date "2024-05")
     (gemini-1.5-flash-8b
      :description "High volume and lower intelligence tasks"
      :capabilities (tool-use json media)
      :context-window 1000
+     :max-output 8192
      :mime-types ("image/png" "image/jpeg" "image/webp" "image/heic" "image/heif"
                   "application/pdf" "text/plain" "text/csv" "text/html")
      ;; input & output price is halved for prompts of 128k tokens or less
      :input-cost 0.075
      :output-cost 0.30
+     :cost-url ,gptel--gemini-cost-url
      :cutoff-date "2024-10")
     (gemini-exp-1206
      :description "Improved coding, reasoning and vision capabilities"
@@ -363,28 +372,33 @@ files in the context."
      :mime-types ("image/png" "image/jpeg" "image/webp" "image/heic" "image/heif"
                   "application/pdf" "text/plain" "text/csv" "text/html")
      :context-window 1000
+     :max-output 8192
      :input-cost 0.10
      :output-cost 0.40
+     :cost-url ,gptel--gemini-cost-url
      :cutoff-date "2024-08")
     (gemini-2.0-flash-lite-preview-02-05
      :description "Gemini 2.0 Flash model optimized for cost efficiency and low latency"
      :capabilities (json)
      :context-window 1000
      :input-cost 0.075
      :output-cost 0.30
+     :cost-url ,gptel--gemini-cost-url
      :cutoff-date "2024-08")
     (gemini-2.0-pro-exp-02-05
      :description "Next gen, high speed, multimodal for a diverse variety of tasks"
      :capabilities (tool-use json)
      :context-window 2000
      :input-cost 0.00
      :output-cost 0.00
+     :cost-url ,gptel--gemini-cost-url
      :cutoff-date "2024-08")
     (gemini-2.0-flash-thinking-exp-01-21
      :description "Next gen, high speed, multimodal for a diverse variety of tasks"
      :capabilities (json)
      :input-cost 0.00
      :output-cost 0.00
+     :cost-url ,gptel--gemini-cost-url
      :cutoff-date "2024-08")
     (gemini-2.0-flash-exp
      :description "Multi-modal, streaming, tool use 2000 RPM"
@@ -394,6 +408,7 @@ files in the context."
      :context-window 1000
      :input-cost 0.00
      :output-cost 0.00
+     :cost-url ,gptel--gemini-cost-url
      :cutoff-date "2024-08")
     (gemini-2.0-flash-thinking-exp
      :description "DEPRECATED: Please use gemini-2.0-flash-thinking-exp-01-21 instead."
@@ -413,10 +428,14 @@ Keys:
 
 - `:context-window': the context window size, in thousands of tokens.
 
+- `:max-output': maximum number of output tokens.
+
 - `:input-cost': the input cost, in US dollars per million tokens.
 
 - `:output-cost': the output cost, in US dollars per million tokens.
 
+- `:cost-url': web page for current model pricing.
+
 - `:cutoff-date': the knowledge cutoff date.
 
 - `:request-params': a plist of additional request parameters to
diff --git a/gptel-openai-extras.el b/gptel-openai-extras.el
@@ -339,12 +339,16 @@ The Deepseek API requires strictly alternating roles (user/assistant) in message
           (models '((deepseek-reasoner
                      :capabilities (tool reasoning)
                      :context-window 64
+		     :max-output 8192
                      :input-cost 0.55
-                     :output-cost 2.19)
+                     :output-cost 2.19
+		     :cost-url "https://api-docs.deepseek.com/quick_start/pricing/")
                     (deepseek-chat
                      :capabilities (tool)
                      :context-window 64
+		     :max-output 8192
                      :input-cost 0.27
+		     :cost-url "https://api-docs.deepseek.com/quick_start/pricing/"
                      :output-cost 1.10))))
   "Register a DeepSeek backend for gptel with NAME."
   (declare (indent 1))
diff --git a/gptel-transient.el b/gptel-transient.el
@@ -576,6 +576,13 @@ Also format its value in the Transient menu."
     (gptel--infix-context-add-file)
     (gptel--infix-context-remove-all)
     (gptel--suffix-context-buffer)]
+   ["" "Info"
+    ("h" "Describe model"
+     (lambda ()
+       "Describe the current gptel model."
+       (interactive)
+       (describe-gptel-model gptel-backend gptel-model))
+     :transient t)]
    [:pad-keys t
     :if (lambda () (and gptel-use-tools gptel--known-tools))
     "" (:info
diff --git a/gptel.el b/gptel.el