tests: Add tool-calling openai integration tests

ericdallo · ericdallo · commit 8b82bf1411ff · 2025-08-14T18:47:29.000-03:00
diff --git a/docs/protocol.md b/docs/protocol.md
@@ -657,7 +657,7 @@ interface ToolCalledContent {
         /**
          * The content of this output
          */
-        content: string; 
+        text: string; 
     }];
     
     /**
diff --git a/integration-test/entrypoint.clj b/integration-test/entrypoint.clj
@@ -5,7 +5,7 @@
    [llm-mock.server :as llm-mock.server]))
 
 (def namespaces
+  ;; Integration test namespaces (presumably loaded and run by this entrypoint —
+  ;; confirm against the runner code in this file). Keep every suite listed:
+  ;; a commented-out entry silently drops that suite from the run.
   '[integration.initialize-test
     integration.chat.openai-test])
 
 (defn timeout [timeout-ms callback]
diff --git a/integration-test/integration/chat/openai_test.clj b/integration-test/integration/chat/openai_test.clj
@@ -3,20 +3,13 @@
    [clojure.test :refer [deftest is testing]]
    [integration.eca :as eca]
    [integration.fixture :as fixture]
+   [integration.helper :refer [match-content] :as h]
    [llm-mock.mocks :as llm.mocks]
    [matcher-combinators.matchers :as m]
    [matcher-combinators.test :refer [match?]]))
 
 (eca/clean-after-test)
 
-(defn match-content [chat-id request-id role content]
-  (is (match?
-       {:chatId chat-id
-        :requestId request-id
-        :role role
-        :content content}
-       (eca/client-awaits-server-notification :chat/contentReceived))))
-
 (deftest simple-text
   (eca/start-process!)
 
@@ -210,3 +203,104 @@
                       {:role "user" :content [{:type "input_text" :text "how are you?"}]}]
               :instructions (m/pred string?)}
              llm.mocks/*last-req-body*))))))
+
+(deftest tool-calling
+  ;; Sends one chat prompt while the LLM mock is in the :tool-calling-0 case and
+  ;; asserts (1) the ordered sequence of chat/contentReceived notifications and
+  ;; (2) the body of the last request captured by the mock.
+  (eca/start-process!)
+
+  (eca/request! (fixture/initialize-request))
+  (eca/notify! (fixture/initialized-notification))
+  (let [chat-id* (atom nil)
+        resources-path (h/project-path->canon-path "resources")
+        ;; Hand-built JSON text matching the argument chunks streamed by the mock.
+        args-json (str "{\"path\":\"" resources-path "\"}")
+        ;; Newlines are appended AFTER canonicalization so "\n" never becomes
+        ;; part of the file name handed to the filesystem.
+        ;; NOTE(review): the expected order (file2 before file1) presumably
+        ;; depends on how the tool lists the directory — confirm it is
+        ;; deterministic across platforms.
+        tree-output (str "[FILE] " (h/project-path->canon-path "resources/file2.md") "\n"
+                         "[FILE] " (h/project-path->canon-path "resources/file1.md") "\n")]
+    (testing "We ask what files LLM see"
+      (llm.mocks/set-case! :tool-calling-0)
+      (let [req-id 0
+            resp (eca/request! (fixture/chat-prompt-request
+                                {:request-id req-id
+                                 :model "gpt-5"
+                                 :message "What files you see?"}))
+            chat-id (reset! chat-id* (:chatId resp))]
+
+        (is (match?
+             {:chatId (m/pred string?)
+              :model "gpt-5"
+              :status "success"}
+             resp))
+
+        (match-content chat-id req-id "user" {:type "text" :text "What files you see?\n"})
+        (match-content chat-id req-id "system" {:type "progress" :state "running" :text "Waiting model"})
+        (match-content chat-id req-id "system" {:type "progress" :state "running" :text "Generating"})
+        (match-content chat-id req-id "assistant" {:type "reasonStarted" :id "123"})
+        (match-content chat-id req-id "assistant" {:type "reasonText" :id "123" :text "I should call tool"})
+        (match-content chat-id req-id "assistant" {:type "reasonText" :id "123" :text " eca_directory_tree"})
+        (match-content chat-id req-id "assistant" {:type "reasonFinished" :id "123"})
+        (match-content chat-id req-id "assistant" {:type "text" :text "I will list files"})
+        ;; toolCallPrepare is expected once per streamed chunk, each carrying
+        ;; the arguments text accumulated so far.
+        (match-content chat-id req-id "assistant" {:type "toolCallPrepare"
+                                                   :origin "native"
+                                                   :id "tool-1"
+                                                   :name "eca_directory_tree"
+                                                   :argumentsText ""
+                                                   :manualApproval false
+                                                   :summary "Listing file tree"})
+        (match-content chat-id req-id "assistant" {:type "toolCallPrepare"
+                                                   :origin "native"
+                                                   :id "tool-1"
+                                                   :name "eca_directory_tree"
+                                                   :argumentsText "{\"pat"
+                                                   :manualApproval false
+                                                   :summary "Listing file tree"})
+        (match-content chat-id req-id "assistant" {:type "toolCallPrepare"
+                                                   :origin "native"
+                                                   :id "tool-1"
+                                                   :name "eca_directory_tree"
+                                                   :argumentsText args-json
+                                                   :manualApproval false
+                                                   :summary "Listing file tree"})
+        (match-content chat-id req-id "system" {:type "usage"
+                                                :messageInputTokens 5
+                                                :messageOutputTokens 30
+                                                :sessionTokens 35
+                                                :messageCost (m/pred string?)
+                                                :sessionCost (m/pred string?)})
+        (match-content chat-id req-id "assistant" {:type "toolCallRun"
+                                                   :origin "native"
+                                                   :id "tool-1"
+                                                   :name "eca_directory_tree"
+                                                   :arguments {:path resources-path}
+                                                   :manualApproval false
+                                                   :summary "Listing file tree"})
+        (match-content chat-id req-id "assistant" {:type "toolCalled"
+                                                   :origin "native"
+                                                   :id "tool-1"
+                                                   :name "eca_directory_tree"
+                                                   :arguments {:path resources-path}
+                                                   :summary "Listing file tree"
+                                                   :error false
+                                                   :outputs [{:type "text" :text tree-output}]})
+        (match-content chat-id req-id "assistant" {:type "text" :text "The files I see:\n"})
+        (match-content chat-id req-id "assistant" {:type "text" :text "file1\nfile2\n"})
+        (match-content chat-id req-id "system" {:type "usage"
+                                                :messageInputTokens 5
+                                                :messageOutputTokens 30
+                                                :sessionTokens 70
+                                                :messageCost (m/pred string?)
+                                                :sessionCost (m/pred string?)})
+        (match-content chat-id req-id "system" {:type "progress" :state "finished"})
+        (is (match?
+             {:input [{:role "user" :content [{:type "input_text" :text "What files you see?"}]}
+                      {:type "reasoning"
+                       :id "123"
+                       :summary [{:type "summary_text" :text "I should call tool eca_directory_tree"}]
+                       :encrypted_content "enc-123"}
+                      {:role "assistant" :content [{:type "output_text" :text "I will list files"}]}
+                      {:type "function_call"
+                       :name "eca_directory_tree"
+                       :call_id "tool-1"
+                       :arguments args-json}
+                      {:type "function_call_output"
+                       :call_id "tool-1"
+                       ;; The output sent back to the model is expected with one
+                       ;; more trailing newline than the toolCalled notification.
+                       :output (str tree-output "\n")}]
+              :tools (m/embeds
+                      [{:name "eca_directory_tree"}])
+              :instructions (m/pred string?)}
+             llm.mocks/*last-req-body*))))))
diff --git a/integration-test/integration/helper.clj b/integration-test/integration/helper.clj
@@ -2,7 +2,10 @@
   (:require
    [babashka.fs :as fs]
    [clojure.java.io :as io]
-   [clojure.string :as string]))
+   [clojure.string :as string]
+   [clojure.test :refer [is]]
+   [integration.eca :as eca]
+   [matcher-combinators.test :refer [match?]]))
 
 (def windows?
   "Whether is running on MS-Windows."
@@ -18,6 +21,11 @@
       fs/canonicalize
       str))
 
+(defn project-path->canon-path
+  "Resolves SUB-PATH against `default-root-project-path` and returns the
+  canonical path of the resulting file as a string."
+  [sub-path]
+  (-> (io/file default-root-project-path sub-path)
+      .getCanonicalPath))
+
 (defn escape-uri
   "Escapes enough URI characters for testing purposes and returns it.
 
@@ -34,3 +42,11 @@
     (if *escape-uris?*
       (escape-uri uri)
       uri)))
+
+(defn match-content
+  "Awaits a `:chat/contentReceived` server notification and asserts, via
+  `match?`, that it carries CHAT-ID, REQUEST-ID, ROLE and CONTENT."
+  [chat-id request-id role content]
+  (let [expected {:chatId chat-id
+                  :requestId request-id
+                  :role role
+                  :content content}]
+    ;; The await call stays inside `is` so an exception thrown while waiting is
+    ;; reported by clojure.test rather than escaping this helper.
+    (is (match? expected
+                (eca/client-awaits-server-notification :chat/contentReceived)))))
diff --git a/integration-test/llm_mock/openai.clj b/integration-test/llm_mock/openai.clj
@@ -1,6 +1,7 @@
 (ns llm-mock.openai
   (:require
    [cheshire.core :as json]
+   [integration.helper :as h]
    [llm-mock.mocks :as llm.mocks]
    [org.httpkit.server :as hk]))
 
@@ -110,21 +111,90 @@
                          :status "completed"}})
   (hk/close ch))
 
+(defn ^:private tool-calling-0
+  "Mock response for the `:tool-calling-0` case, streamed as SSE events on CH.
+
+  The stage is chosen from the last captured request body: when its `:input`
+  already contains a `function_call_output` item, the final answer text is
+  streamed; otherwise a reasoning prelude, a short text and a function call to
+  `eca_directory_tree` are streamed. CH is closed at the end of either stage."
+  [ch]
+  (let [tool-output-sent? (some (comp #{"function_call_output"} :type)
+                                (:input llm.mocks/*last-req-body*))]
+    (if tool-output-sent?
+      ;; Stage 2: the tool output was supplied back, answer with plain text.
+      (do
+        (sse-send! ch "response.output_text.delta"
+                   {:type "response.output_text.delta" :delta "The files I see:\n"})
+        (sse-send! ch "response.output_text.delta"
+                   {:type "response.output_text.delta" :delta "file1\nfile2\n"})
+        (sse-send! ch "response.completed"
+                   {:type "response.completed"
+                    :response {:output []
+                               :usage {:input_tokens 5
+                                       :output_tokens 30}
+                               :status "completed"}}))
+      ;; Stage 1: reason, emit a short text, then request the tool call.
+      (let [resources-path (h/project-path->canon-path "resources")
+            args-json (json/generate-string {:path resources-path})
+            call-item {:type "function_call"
+                       :id "item-1"
+                       :call_id "tool-1"
+                       :name "eca_directory_tree"}]
+        ;; Reasoning item: opened, two summary deltas, then closed.
+        (sse-send! ch "response.output_item.added"
+                   {:type "response.output_item.added"
+                    :item {:type "reasoning" :id "123"}})
+        (sse-send! ch "response.reasoning_summary_text.delta"
+                   {:type "response.reasoning_summary_text.delta"
+                    :item_id "123"
+                    :delta "I should call tool"})
+        (sse-send! ch "response.reasoning_summary_text.delta"
+                   {:type "response.reasoning_summary_text.delta"
+                    :item_id "123"
+                    :delta " eca_directory_tree"})
+        (sse-send! ch "response.output_item.done"
+                   {:type "response.output_item.done"
+                    :item {:type "reasoning"
+                           :id "123"
+                           :encrypted_content "enc-123"}})
+        ;; Assistant text emitted ahead of the tool call.
+        (sse-send! ch "response.output_text.delta"
+                   {:type "response.output_text.delta" :delta "I will list files"})
+        ;; The function call starts with empty arguments...
+        (sse-send! ch "response.output_item.added"
+                   {:type "response.output_item.added"
+                    :item (assoc call-item :arguments "")})
+        ;; ...which then arrive in two chunks.
+        ;; NOTE(review): the second chunk is concatenated by hand while
+        ;; `args-json` comes from cheshire; the two agree only while the path
+        ;; needs no JSON escaping — confirm for Windows paths.
+        (sse-send! ch "response.function_call_arguments.delta"
+                   {:type "response.function_call_arguments.delta"
+                    :item_id "item-1"
+                    :delta "{\"pat"})
+        (sse-send! ch "response.function_call_arguments.delta"
+                   {:type "response.function_call_arguments.delta"
+                    :item_id "item-1"
+                    :delta (str "h\":\"" resources-path "\"}")})
+        ;; The completed response repeats the whole function call so the client
+        ;; triggers the tool.
+        (sse-send! ch "response.completed"
+                   {:type "response.completed"
+                    :response {:output [(assoc call-item :arguments args-json)]
+                               :usage {:input_tokens 5
+                                       :output_tokens 30}
+                               :status "completed"}})))
+    (hk/close ch)))
+
 (defn handle-openai-responses [req]
+  ;; Handler for the mocked OpenAI responses endpoint: stores the request body
+  ;; (parsed as JSON with keyword keys) via llm.mocks/set-last-req-body!, then
+  ;; streams the SSE events of the currently selected llm.mocks/*case*.
   (llm.mocks/set-last-req-body! (some-> (slurp (:body req))
                                         (json/parse-string true)))
   (hk/as-channel
-    req
-    {:on-open (fn [ch]
+   req
+   {:on-open (fn [ch]
                 ;; initial SSE handshake
-                (hk/send! ch {:status 200
-                              :headers {"Content-Type" "text/event-stream; charset=utf-8"
-                                        "Cache-Control" "no-cache"
-                                        "Connection" "keep-alive"}}
-                          false)
-                (case llm.mocks/*case*
-                  :simple-text-0 (simple-text-0 ch)
-                  :simple-text-1 (simple-text-1 ch)
-                  :simple-text-2 (simple-text-2 ch)
-                  :reasoning-0 (reasoning-0 ch)
-                  :reasoning-1 (reasoning-1 ch)))}))
+               ;; The trailing `false` keeps the channel open after the headers
+               ;; are sent, so the case handler can keep streaming events.
+               (hk/send! ch {:status 200
+                             :headers {"Content-Type" "text/event-stream; charset=utf-8"
+                                       "Cache-Control" "no-cache"
+                                       "Connection" "keep-alive"}}
+                         false)
+               ;; Dispatch to the handler of the active mock case. `case` has no
+               ;; default clause here, so an unlisted *case* value throws.
+               (case llm.mocks/*case*
+                 :simple-text-0 (simple-text-0 ch)
+                 :simple-text-1 (simple-text-1 ch)
+                 :simple-text-2 (simple-text-2 ch)
+                 :reasoning-0 (reasoning-0 ch)
+                 :reasoning-1 (reasoning-1 ch)
+                 :tool-calling-0 (tool-calling-0 ch)))}))
diff --git a/integration-test/sample-test/resources/file1.md b/integration-test/sample-test/resources/file1.md
@@ -0,0 +1 @@
+Something here
diff --git a/integration-test/sample-test/resources/file2.md b/integration-test/sample-test/resources/file2.md
@@ -0,0 +1 @@
+Other thing here