-
Notifications
You must be signed in to change notification settings - Fork 93
/
Copy pathchatgpt-shell-google.el
438 lines (381 loc) · 20 KB
/
chatgpt-shell-google.el
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
;;; chatgpt-shell-google.el --- Google-specific logic -*- lexical-binding: t -*-
;; Copyright (C) 2023-2025 Alvaro Ramirez
;; Author: Alvaro Ramirez https://xenodium.com
;; URL: https://github.com/xenodium/chatgpt-shell
;; Package-Requires: ((emacs "28.1") (shell-maker "0.72.1"))
;; This package is free software; you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation; either version 3, or (at your option)
;; any later version.
;; This package is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
;; GNU General Public License for more details.
;; You should have received a copy of the GNU General Public License
;; along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
;;; Commentary:
;; Adds Google specifics for `chatgpt-shell'.
;;; Code:
(eval-when-compile
(require 'cl-lib))
(require 'let-alist)
(require 'shell-maker)
(require 'map)
(require 'rx)
(require 'json)
(defvar chatgpt-shell-proxy)
(defcustom chatgpt-shell-google-key nil
"Google API key as a string or a function that loads and returns it."
:type '(choice (function :tag "Function")
(string :tag "String"))
:group 'chatgpt-shell)
(defcustom chatgpt-shell-google-api-url-base "https://generativelanguage.googleapis.com"
"Google API's base URL.
API url = base + path.
If you use Gemini through a proxy service, change the URL base."
:type 'string
:safe #'stringp
:group 'chatgpt-shell)
;; https://ai.google.dev/gemini-api/docs/tokens
;; A token is equivalent to _about_ 4 characters.
(cl-defun chatgpt-shell-google-make-model (&key version short-version path token-width context-window grounding-search)
"Create a Google model.
Set VERSION, SHORT-VERSION, PATH, TOKEN-WIDTH, CONTEXT-WINDOW,
VALIDATE-COMMAND, and GROUNDING-SEARCH handler."
(unless version
(error "Missing mandatory :version param"))
(unless short-version
(error "Missing mandatory :short-version param"))
(unless path
(error "Missing mandatory :path param"))
(unless token-width
(error "Missing mandatory :token-width param for %s" version))
(unless context-window
(error "Missing mandatory :context-window param for %s" version))
`((:version . ,version)
(:short-version . ,short-version)
(:label . "Gemini")
(:provider . "Google")
(:path . ,path)
(:token-width . ,token-width)
(:context-window . ,context-window)
(:grounding-search . ,grounding-search)
(:url-base . chatgpt-shell-google-api-url-base)
(:handler . chatgpt-shell-google--handle-gemini-command)
(:filter . chatgpt-shell-google--extract-gemini-response)
(:payload . chatgpt-shell-google--make-payload)
(:url . chatgpt-shell-google--make-url)
(:headers . chatgpt-shell-google--make-headers)
(:key . chatgpt-shell-google-key)
(:validate-command . chatgpt-shell-google--validate-command)))
(defun chatgpt-shell-google--current-generative-model-p (api-response)
"Determine if model in API-RESPONSE is generative.
It returns non-nil if the model described in API-RESPONSE is current and
supports \"generateContent\".
This is used to filter the list of models returned from
https://generativelanguage.googleapis.com"
(let-alist api-response
(and .supportedGenerationMethods
(not (and .description (string-match-p (rx (or "discontinued" "deprecated")) .description)))
(seq-contains-p .supportedGenerationMethods "generateContent"))))
(defun chatgpt-shell-google--fetch-model-versions ()
"Retrieves the list of generative models from the Google API."
(unless (chatgpt-shell-google-key)
(user-error "Please set your `chatgpt-shell-google-key'"))
(with-current-buffer (url-retrieve-synchronously
(concat chatgpt-shell-google-api-url-base "/v1beta/models?key="
(chatgpt-shell-google-key)))
(goto-char (if (boundp 'url-http-end-of-headers)
url-http-end-of-headers
(error "`url-http-end-of-headers' marker is not defined")))
(if-let* ((parsed-response
(shell-maker--json-parse-string
(buffer-substring-no-properties (point) (point-max)))))
(let-alist parsed-response
(seq-filter #'chatgpt-shell-google--current-generative-model-p .models))
(error "No response from Google"))))
(defun chatgpt-shell-google--parse-model (api-response)
"Parse Google API-RESPONSE and return a `chatgpt-shell' model."
(let-alist api-response
(let* ((model-version (string-remove-prefix "models/" .name))
(model-shortversion (string-remove-prefix "gemini-" model-version))
(model-urlpath (concat "/v1beta/" .name))
;; The api-response descriptor does not stipulate whether grounding is supported.
;; This logic applies a heuristic based on the model name (aka version).
(model-supports-grounding (string-match-p (rx bol (or "gemini-1.5" "gemini-2.0")) model-version)))
(chatgpt-shell-google-make-model :version model-version
:short-version model-shortversion
:grounding-search model-supports-grounding
:path model-urlpath
:token-width 4
:context-window .inputTokenLimit))))
(cl-defun chatgpt-shell-google-load-models (&key override)
"Query Google for the list of Gemini LLM models available.
By default, this package uses a static list of models as returned from
`chatgpt-shell-google-models'. But some users may want to choose from
a fresher set of available models.
This function retrieves data from
https://ai.google.dev/gemini-api/docs/models/gemini. This fn then
appends the models retrieved to the `chatgpt-shell-models' list, unless
a model with the same name is already present.
By default, replace the existing Google models in `chatgpt-shell-models'
with the newly retrieved models. When OVERRIDE is non-nil, which
happens when the function is invoked interactively with a prefix
argument, replace all the Google models with those retrieved."
(interactive (list :override current-prefix-arg))
(let* ((goog-predicate (lambda (model)
(string= (map-elt model :provider) "Google")))
(goog-index (or (cl-position-if goog-predicate chatgpt-shell-models)
(length chatgpt-shell-models))))
(setq chatgpt-shell-models (and (not override)
(cl-remove-if goog-predicate chatgpt-shell-models)))
(let* ((existing-gemini-models
(mapcar (lambda (model) (map-elt model :version))
(cl-remove-if-not goog-predicate chatgpt-shell-models)))
(new-gemini-models
(mapcar #'chatgpt-shell-google--parse-model (chatgpt-shell-google--fetch-model-versions))))
(setq chatgpt-shell-models
(append (seq-take chatgpt-shell-models goog-index)
new-gemini-models
(seq-drop chatgpt-shell-models goog-index)))
(message "Added %d Gemini model(s); kept %d existing Gemini model(s)"
(length new-gemini-models)
(length existing-gemini-models)))))
(defun chatgpt-shell-google-toggle-grounding-with-google-search ()
"Toggle the `:grounding-search' boolean for the currently-selected model.
Google's documentation states that All Gemini 1.5 and 2.0 models support
grounding with Google search, and `:grounding-search' will be t for
those models. For models that support grounding, this package will
include a
(tools .((google_search . ())))
in the request payload for 2.0+ models, or
(tools .((google_search_retrieval . ())))
for 1.5-era models.
But some of the experimental models of those versions may not support
grounding. If `chatgpt-shell' tries to send a tools parameter as above
to a model that does not support grounding, the API returns an error.
And in some cases users may wish to not _use_ grounding in Search, even
though it is available.
In either case, the user can invoke this function to toggle
grounding-in-google-search on the model. This package will send the
tools parameter in subsequent outbound requests to that model, when
grounding is enabled.
Returns the new boolean value of `:grounding-search'."
(interactive)
(when-let* ((current-model (chatgpt-shell--resolved-model))
(is-google (string= (map-elt current-model :provider) "Google"))
(current-grounding-cons (assq :grounding-search current-model)))
(let ((toggled (not (cdr current-grounding-cons))))
(setf (cdr current-grounding-cons) toggled)
(message "Grounding in Google search: %s" (if toggled "ON" "OFF"))
toggled)))
(defun chatgpt-shell-google--get-grounding-in-search-tool-keyword (model)
"Retrieves the keyword for the grounding tool.
This gets set once for each MODEL, based on a heuristic."
(when-let* ((current-model model)
(is-google (string= (map-elt current-model :provider) "Google"))
(version (map-elt current-model :version)))
(if (string-match "1\\.5" version)
"google_search_retrieval"
"google_search")))
(defun chatgpt-shell-google-models ()
"Build a list of Google LLM models available."
;; Context windows have been verified as of 11/26/2024. See
;; https://ai.google.dev/gemini-api/docs/models/gemini.
(list (chatgpt-shell-google-make-model :version "gemini-2.5-pro-exp"
:short-version "2.5-pro-exp"
:path "/v1beta/models/gemini-2.5-pro-exp-03-25"
:token-width 4
:context-window 1048576)
(chatgpt-shell-google-make-model :version "gemini-2.0-pro-exp"
:short-version "2.0-pro-exp"
:path "/v1beta/models/gemini-2.0-pro-exp"
:token-width 4
:context-window 2048576)
(chatgpt-shell-google-make-model :version "gemini-2.0-flash-thinking-exp"
:short-version "2.0-flash-thinking-exp"
:path "/v1beta/models/gemini-2.0-flash-thinking-exp"
:token-width 4
:context-window 1048576)
(chatgpt-shell-google-make-model :version "gemini-2.0-flash"
:short-version "2.0-flash"
:path "/v1beta/models/gemini-2.0-flash"
:grounding-search t
:token-width 4
:context-window 1048576)
(chatgpt-shell-google-make-model :version "gemini-1.5-pro-latest"
:short-version "1.5-pro-latest"
:path "/v1beta/models/gemini-1.5-pro-latest"
:token-width 4
:context-window 2097152)
(chatgpt-shell-google-make-model :version "gemini-1.5-flash-latest"
:short-version "1.5-flash-latest"
:path "/v1beta/models/gemini-1.5-flash-latest"
:token-width 4
:context-window 1048576)))
(defun chatgpt-shell-google--validate-command (_command _model _settings)
"Return error string if command/setup isn't valid."
(unless chatgpt-shell-google-key
"Variable `chatgpt-shell-google-key' needs to be set to your key.
Try M-x set-variable chatgpt-shell-google-key
or
(setq chatgpt-shell-google-key \"my-key\")"))
(defun chatgpt-shell-google-key ()
"Get the Google API key."
(cond ((stringp chatgpt-shell-google-key)
chatgpt-shell-google-key)
((functionp chatgpt-shell-google-key)
(condition-case _err
(funcall chatgpt-shell-google-key)
(error
"KEY-NOT-FOUND")))
(t
nil)))
(cl-defun chatgpt-shell-google--make-url (&key _command model settings)
"Create the API URL using MODEL and SETTINGS."
(unless model
(error "Missing mandatory :model param"))
(unless settings
(error "Missing mandatory :settings param"))
(concat chatgpt-shell-google-api-url-base
(or (map-elt model :path)
(error "Provider :path not found"))
(if (map-elt settings :streaming)
":streamGenerateContent"
":generateContent")
"?key="
(or (chatgpt-shell-google-key)
(error "Your chatgpt-shell-google-key is missing"))
"&alt=sse")) ;; Needed or streaming doesn't work.
(cl-defun chatgpt-shell-google--make-headers (&key _model _settings)
"Create the API headers."
(list "Content-Type: application/json; charset=utf-8"))
(cl-defun chatgpt-shell-google--make-payload (&key model context settings)
"Create the API payload using MODEL CONTEXT and SETTINGS."
(chatgpt-shell-google--make-gemini-payload
:context context
:model model
:settings settings))
(cl-defun chatgpt-shell-google--handle-gemini-command (&key model command context shell settings)
"Handle Gemini COMMAND (prompt) using MODEL, CONTEXT, SHELL, and SETTINGS."
(shell-maker-make-http-request
:async t
:url (chatgpt-shell-google--make-url :model model
:settings settings)
:proxy chatgpt-shell-proxy
:data (chatgpt-shell-google--make-gemini-payload
:prompt command
:context context
:model model
:settings settings)
:headers (list "Content-Type: application/json; charset=utf-8")
:filter #'chatgpt-shell-google--extract-gemini-response
:shell shell))
(cl-defun chatgpt-shell-google--make-gemini-payload (&key prompt context settings model)
"Create the request payload.
Compose using PROMPT, CONTEXT, SETTINGS and MODEL."
(append
(when (map-elt settings :system-prompt)
`((system_instruction . ((parts . ((text . ,(map-elt settings :system-prompt))))))))
`((contents . ,(vconcat
(chatgpt-shell-google--gemini-user-model-messages
(append context
(when prompt
(list (cons prompt nil))))))))
(when (map-elt model :grounding-search)
;; Grounding in Google Search is supported for both Gemini 1.5 and 2.0 models.
;; But the API is slightly different between them. This uses the correct tool name.
`((tools . ((,(intern (chatgpt-shell-google--get-grounding-in-search-tool-keyword model)) . ())))))
`((generation_config . ((temperature . ,(or (map-elt settings :temperature) 1))
;; 1 is most diverse output.
(topP . 1))))))
(defun chatgpt-shell-google--gemini-user-model-messages (context)
"Convert CONTEXT to gemini messages.
Sequence must be a vector for json serialization.
For example:
[
((role . \"user\") (parts . ((text . \"hello\"))))
((role . \"model\") (parts . ((text . \"world\"))))
]"
(let ((result))
(mapc
(lambda (item)
(when (car item)
(push (list (cons 'role "user")
(cons 'parts (vconcat ;; Vector for json
(list (list (cons 'text (car item))))))) result))
(when (cdr item)
(push (list (cons 'role "model")
(cons 'parts (vconcat ;; Vector for json
(list (list (cons 'text (cdr item))))))) result)))
context)
(nreverse result)))
(defun chatgpt-shell-google--extract-gemini-response (raw-response)
"Extract Gemini response from RAW-RESPONSE."
(if-let* ((whole (shell-maker--json-parse-string raw-response))
(response (or (let-alist whole
.error.message)
(let-alist whole
(mapconcat (lambda (choice)
(let-alist choice
(or .delta.content
.message.content)))
.choices "")))))
response
(if-let ((chunks (shell-maker--split-text raw-response)))
(let ((response)
(pending)
(result))
(mapc (lambda (chunk)
;; Response chunks come in the form:
;; data: {...}
;; data: {...}
(if-let* ((is-data (equal (map-elt chunk :key) "data:"))
(obj (shell-maker--json-parse-string (map-elt chunk :value)))
(text (let-alist obj
(or (let-alist (seq-first .candidates)
(cond ((seq-first .content.parts)
(let-alist (seq-first .content.parts)
.text))
((equal .finishReason "RECITATION")
"")
((equal .finishReason "STOP")
"")
((equal .finishReason "CANCELLED")
"Error: Request cancellled.")
((equal .finishReason "CRASHED")
"Error: An error occurred. Try again.")
((equal .finishReason "END_OF_PROMPT")
"Error: Couldn't generate a response. Try rephrasing.")
((equal .finishReason "LENGTH")
"Error: Response is too big. Try rephrasing.")
((equal .finishReason "TIME")
"Error: Timed out.")
((equal .finishReason "SAFETY")
"Error: Flagged for safety.")
((equal .finishReason "LANGUAGE")
"Error: Flagged for language.")
((equal .finishReason "BLOCKLIST")
"Error: Flagged for forbidden terms.")
((equal .finishReason "PROHIBITED_CONTENT")
"Error: Flagged for prohibited content.")
((equal .finishReason "SPII")
"Error: Flagged for sensitive personally identifiable information.")
(.finishReason
(format "\n\nError: Something's up (%s)" .finishReason))))
.error.message))))
(unless (string-empty-p text)
(setq response (concat response text)))
(setq pending (concat pending
(or (map-elt chunk :key) "")
(map-elt chunk :value)))))
chunks)
(setq result
(list (cons :filtered (unless (string-empty-p response)
response))
(cons :pending pending)))
result)
(list (cons :filtered nil)
(cons :pending raw-response)))))
(provide 'chatgpt-shell-google)
;;; chatgpt-shell-google.el ends here