Skip to content

Commit ba703a2

Browse files
authored
Fix AI ext openai streaming (#8553)
Should fix the issue reported on Discord: https://discord.com/channels/841451783728529451/1356441709856292914/1356625059585986722. When translating the OpenAI streaming response (https://platform.openai.com/docs/api-reference/chat-streaming/streaming) to the Anthropic-style streaming response (https://docs.anthropic.com/en/api/messages-streaming#event-types), we were not sending a `content_block_start` event before the `content_block_delta` events for the text response, as required. Also, the default prompt did not contain a user message, so the user's query never actually got sent to the LLM — only the system message with the context was sent.
1 parent 227475d commit ba703a2

File tree

3 files changed

+30
-6
lines changed

3 files changed

+30
-6
lines changed

edb/buildmeta.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -57,7 +57,7 @@
5757
# The merge conflict there is a nice reminder that you probably need
5858
# to write a patch in edb/pgsql/patches.py, and then you should preserve
5959
# the old value.
60-
EDGEDB_CATALOG_VERSION = 2025_04_07_00_00
60+
EDGEDB_CATALOG_VERSION = 2025_04_08_19_20
6161
EDGEDB_MAJOR_VERSION = 7
6262

6363

edb/lib/ext/ai.edgeql

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -656,6 +656,13 @@ CREATE EXTENSION PACKAGE ai VERSION '1.0' {
656656
knowledge, answer the user query."
657657
),
658658
}),
659+
(insert ext::ai::ChatPromptMessage {
660+
participant_role := ext::ai::ChatParticipantRole.User,
661+
content := (
662+
"Query: {query}\n\
663+
Answer: "
664+
),
665+
})
659666
}
660667
};
661668

edb/server/protocol/ai_ext.py

Lines changed: 22 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1421,13 +1421,28 @@ async def _start_openai_like_chat(
14211421
+ b'data: ' + event_data + b'\n\n'
14221422
)
14231423
protocol.write_raw(event)
1424+
1425+
event_data = json.dumps({
1426+
"type": "content_block_start",
1427+
"index": 0,
1428+
"content_block": {
1429+
"type": "text",
1430+
"text": ""
1431+
}
1432+
}).encode("utf-8")
1433+
event = (
1434+
b'event: content_block_start\n'
1435+
+ b'data: ' + event_data + b'\n\n'
1436+
)
1437+
protocol.write_raw(event)
1438+
14241439
# if there's only one openai tool call it shows up here
14251440
if tool_calls:
14261441
for tool_call in tool_calls:
14271442
tool_index = tool_call["index"]
14281443
event_data = json.dumps({
14291444
"type": "content_block_start",
1430-
"index": tool_call["index"],
1445+
"index": tool_call["index"] + 1,
14311446
"content_block": {
14321447
"id": tool_call["id"],
14331448
"type": "tool_use",
@@ -1458,14 +1473,14 @@ async def _start_openai_like_chat(
14581473
+ b'data: { \
14591474
"type": "content_block_stop",'
14601475
+ b'"index": '
1461-
+ str(currentIndex - 1).encode()
1476+
+ str(currentIndex).encode()
14621477
+ b'}\n\n'
14631478
)
14641479
protocol.write_raw(event)
14651480

14661481
event_data = json.dumps({
14671482
"type": "content_block_start",
1468-
"index": currentIndex,
1483+
"index": currentIndex + 1,
14691484
"content_block": {
14701485
"id": tool_call.get("id"),
14711486
"type": "tool_use",
@@ -1483,7 +1498,7 @@ async def _start_openai_like_chat(
14831498
else:
14841499
event_data = json.dumps({
14851500
"type": "content_block_delta",
1486-
"index": currentIndex,
1501+
"index": currentIndex + 1,
14871502
"delta": {
14881503
"type": "tool_call_delta",
14891504
"args":
@@ -1497,7 +1512,9 @@ async def _start_openai_like_chat(
14971512
protocol.write_raw(event)
14981513
elif finish_reason := data.get("finish_reason"):
14991514
index = (
1500-
tool_index if finish_reason == "tool_calls" else 0
1515+
tool_index + 1
1516+
if finish_reason == "tool_calls"
1517+
else 0
15011518
)
15021519
event = (
15031520
b'event: content_block_stop\n'

0 commit comments

Comments
 (0)