[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]
[nongnu] elpa/gptel 66a63e6c82 266/273: gptel-ollama: switch to chat API
From: ELPA Syncer
Subject: [nongnu] elpa/gptel 66a63e6c82 266/273: gptel-ollama: switch to chat API
Date: Wed, 1 May 2024 10:02:54 -0400 (EDT)
branch: elpa/gptel
commit 66a63e6c825abe33926dccf2f2ef1c49667b200a
Author: Karthik Chikmagalur <karthikchikmagalur@gmail.com>
Commit: Karthik Chikmagalur <karthikchikmagalur@gmail.com>
gptel-ollama: switch to chat API
* gptel-ollama.el (gptel-curl--parse-stream,
gptel--parse-response, gptel--request-data, gptel--parse-buffer,
gptel--ollama-context, gptel--ollama-token-count,
gptel-make-ollama): Switch to Ollama's chat API from
the completions API. This makes interacting with Ollama fully
stateless, like all the other APIs, and should help significantly
with issues like #249 and #279. Support non-streaming responses
from Ollama in the process.
Remove `gptel--ollama-context` as it is no longer needed.
Add a `gptel--ollama-token-count` for tracking token costs. A UI
affordance for this is not implemented yet, but is planned.
---
gptel-ollama.el | 96 +++++++++++++++++++++++++++++++++------------------------
1 file changed, 56 insertions(+), 40 deletions(-)
diff --git a/gptel-ollama.el b/gptel-ollama.el
index 00b40c9b0e..9ac04ae7c9 100644
--- a/gptel-ollama.el
+++ b/gptel-ollama.el
@@ -34,14 +34,16 @@
(:copier nil)
(:include gptel-backend)))
-(defvar-local gptel--ollama-context nil
- "Context for ollama conversations.
+(defvar-local gptel--ollama-token-count 0
+ "Token count for ollama conversations.
-This variable holds the context array for conversations with
-Ollama models.")
+This variable holds the total token count for conversations with
+Ollama models.
+
+Intended for internal use only.")
(cl-defmethod gptel-curl--parse-stream ((_backend gptel-ollama) info)
- ";TODO: "
+ "Parse response stream for the Ollama API."
(when (bobp)
(re-search-forward "^{")
(forward-line 0))
@@ -50,63 +52,77 @@ Ollama models.")
(while (setq content (gptel--json-read))
(setq pt (point))
(let ((done (map-elt content :done))
- (response (map-elt content :response)))
+ (response (map-nested-elt content '(:message :content))))
(push response content-strs)
(unless (eq done :json-false)
(with-current-buffer (plist-get info :buffer)
- (setq gptel--ollama-context (map-elt content :context)))
+ (cl-incf gptel--ollama-token-count
+ (+ (or (map-elt content :prompt_eval_count) 0)
+ (or (map-elt content :eval_count) 0))))
(goto-char (point-max)))))
(error (goto-char pt)))
(apply #'concat (nreverse content-strs))))
(cl-defmethod gptel--parse-response ((_backend gptel-ollama) response info)
- (when-let ((context (map-elt response :context)))
+ "Parse a one-shot RESPONSE from the Ollama API."
+ (when-let ((context
+ (+ (or (map-elt response :prompt_eval_count) 0)
+ (or (map-elt response :eval_count) 0))))
(with-current-buffer (plist-get info :buffer)
- (setq gptel--ollama-context context)))
- (map-elt response :response))
+ (cl-incf gptel--ollama-token-count context)))
+ (map-nested-elt response '(:message :content)))
(cl-defmethod gptel--request-data ((_backend gptel-ollama) prompts)
- "JSON encode PROMPTS for Ollama."
+ "JSON encode PROMPTS for sending to ChatGPT."
(let ((prompts-plist
`(:model ,gptel-model
- ,@prompts
+ :messages [,@prompts]
:stream ,(or (and gptel-stream gptel-use-curl
- (gptel-backend-stream gptel-backend))
- :json-false))))
- (when gptel--ollama-context
- (plist-put prompts-plist :context gptel--ollama-context))
+ (gptel-backend-stream gptel-backend))
+ :json-false)))
+ options-plist)
+ (when gptel-temperature
+ (setq options-plist
+ (plist-put options-plist :temperature
+ gptel-temperature)))
+ (when gptel-max-tokens
+ (setq options-plist
+ (plist-put options-plist :num_predict
+ gptel-max-tokens)))
+ (when options-plist
+ (plist-put prompts-plist :options options-plist))
prompts-plist))
-(cl-defmethod gptel--parse-buffer ((_backend gptel-ollama) &optional
_max-entries)
- (let ((prompts)
- (prop (text-property-search-backward
- 'gptel 'response
- (when (get-char-property (max (point-min) (1- (point)))
- 'gptel)
- t))))
- (if (and (prop-match-p prop)
- (prop-match-value prop))
- (user-error "No user prompt found!")
- (setq prompts (list
- :system gptel--system-message
- :prompt
- (if (prop-match-p prop)
- (string-trim
- (buffer-substring-no-properties
(prop-match-beginning prop)
- (prop-match-end
prop))
- (format "[\t\r\n ]*\\(?:%s\\)?[\t\r\n ]*"
- (regexp-quote (gptel-prompt-prefix-string)))
- (format "[\t\r\n ]*\\(?:%s\\)?[\t\r\n ]*"
- (regexp-quote
(gptel-response-prefix-string))))
- "")))
- prompts)))
+(cl-defmethod gptel--parse-buffer ((_backend gptel-ollama) &optional
max-entries)
+ (let ((prompts) (prop))
+ (while (and
+ (or (not max-entries) (>= max-entries 0))
+ (setq prop (text-property-search-backward
+ 'gptel 'response
+ (when (get-char-property (max (point-min) (1- (point)))
+ 'gptel)
+ t))))
+ (push (list :role (if (prop-match-value prop) "assistant" "user")
+ :content
+ (string-trim
+ (buffer-substring-no-properties (prop-match-beginning prop)
+ (prop-match-end prop))
+ (format "[\t\r\n ]*\\(?:%s\\)?[\t\r\n ]*"
+ (regexp-quote (gptel-prompt-prefix-string)))
+ (format "[\t\r\n ]*\\(?:%s\\)?[\t\r\n ]*"
+ (regexp-quote (gptel-response-prefix-string)))))
+ prompts)
+ (and max-entries (cl-decf max-entries)))
+ (cons (list :role "system"
+ :content gptel--system-message)
+ prompts)))
;;;###autoload
(cl-defun gptel-make-ollama
(name &key curl-args header key models stream
(host "localhost:11434")
(protocol "http")
- (endpoint "/api/generate"))
+ (endpoint "/api/chat"))
"Register an Ollama backend for gptel with NAME.
Keyword arguments:
- [nongnu] elpa/gptel e5f54d1d09 229/273: gptel-anthropic: Modify order of request items, (continued)
- [nongnu] elpa/gptel e5f54d1d09 229/273: gptel-anthropic: Modify order of request items, ELPA Syncer, 2024/05/01
- [nongnu] elpa/gptel f529457bbe 232/273: gptel: Use visual-line-mode when ediff-ing, ELPA Syncer, 2024/05/01
- [nongnu] elpa/gptel 9eea4be5ed 245/273: gptel-transient: Fix gptel-menu definition bug (#265), ELPA Syncer, 2024/05/01
- [nongnu] elpa/gptel 6d3e4a99f5 236/273: gptel-transient: Rename additional-directive functions, ELPA Syncer, 2024/05/01
- [nongnu] elpa/gptel 5d069cfca8 243/273: gptel-anthropic: Simplify stream parser, ELPA Syncer, 2024/05/01
- [nongnu] elpa/gptel b31c9be5e0 238/273: gptel-ollama: Adjust Ollama stream parser for libjansson, ELPA Syncer, 2024/05/01
- [nongnu] elpa/gptel 73a0cc25ba 237/273: gptel-transient: Simplify model selection, ELPA Syncer, 2024/05/01
- [nongnu] elpa/gptel 12e00cbd09 247/273: gptel-transient: No pre-fill when reading from minibuffer, ELPA Syncer, 2024/05/01
- [nongnu] elpa/gptel 5dcbf40066 241/273: gptel: Make model parameters global, ELPA Syncer, 2024/05/01
- [nongnu] elpa/gptel 567af4d2ee 258/273: gptel-org: Read config from Org properties (#141), ELPA Syncer, 2024/05/01
- [nongnu] elpa/gptel 66a63e6c82 266/273: gptel-ollama: switch to chat API, ELPA Syncer <=
- [nongnu] elpa/gptel a2b16c43b1 268/273: gptel-org: Include org-element-lineage-map with gptel (#294), ELPA Syncer, 2024/05/01