mongodb-js
diff --git a/‎.gitignore‎
Lines changed: 2 additions & 1 deletion b/‎.gitignore‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎scripts/update-accuracy-run-status.ts‎
Lines changed: 3 additions & 7 deletions b/‎scripts/update-accuracy-run-status.ts‎
Lines changed: 3 additions & 7 deletions
diff --git a/‎tests/accuracy/aggregate.test.ts‎
Lines changed: 7 additions & 19 deletions b/‎tests/accuracy/aggregate.test.ts‎
Lines changed: 7 additions & 19 deletions
diff --git a/‎tests/accuracy/collection-indexes.test.ts‎
Lines changed: 8 additions & 12 deletions b/‎tests/accuracy/collection-indexes.test.ts‎
Lines changed: 8 additions & 12 deletions
diff --git a/‎tests/accuracy/collection-schema.test.ts‎
Lines changed: 5 additions & 9 deletions b/‎tests/accuracy/collection-schema.test.ts‎
Lines changed: 5 additions & 9 deletions
diff --git a/‎tests/accuracy/collection-storage-size.test.ts‎
Lines changed: 13 additions & 22 deletions b/‎tests/accuracy/collection-storage-size.test.ts‎
Lines changed: 13 additions & 22 deletions
diff --git a/‎tests/accuracy/count.test.ts‎
Lines changed: 15 additions & 21 deletions b/‎tests/accuracy/count.test.ts‎
Lines changed: 15 additions & 21 deletions
diff --git a/‎tests/accuracy/create-collection.test.ts‎
Lines changed: 21 additions & 27 deletions b/‎tests/accuracy/create-collection.test.ts‎
Lines changed: 21 additions & 27 deletions
diff --git a/‎tests/accuracy/create-index.test.ts‎
Lines changed: 12 additions & 16 deletions b/‎tests/accuracy/create-index.test.ts‎
Lines changed: 12 additions & 16 deletions
diff --git a/‎tests/accuracy/db-stats.test.ts‎
Lines changed: 2 additions & 8 deletions b/‎tests/accuracy/db-stats.test.ts‎
Lines changed: 2 additions & 8 deletions
@@ -11,4 +11,5 @@ state.json
 
 tests/tmp
 coverage
-.accuracy-snapshots
+# Assets generated by accuracy runs
+.accuracy
@@ -1,22 +1,18 @@
 import { getAccuracySnapshotStorage } from "../tests/accuracy/sdk/accuracy-snapshot-storage/get-snapshot-storage.js";
-import {
-    AccuracyRunStatus,
-    AccuracyRunStatuses,
-} from "../tests/accuracy/sdk/accuracy-snapshot-storage/snapshot-storage.js";
+import { AccuracyRunStatus } from "../tests/accuracy/sdk/accuracy-snapshot-storage/snapshot-storage.js";
 
 const envAccuracyRunId = process.env.MDB_ACCURACY_RUN_ID;
 const envAccuracyRunStatus = process.env.MDB_ACCURACY_RUN_STATUS;
 
-let status: AccuracyRunStatuses | undefined;
 if (
     !envAccuracyRunId ||
     (envAccuracyRunStatus !== AccuracyRunStatus.Done && envAccuracyRunStatus !== AccuracyRunStatus.Failed)
 ) {
     process.exit(1);
 }
 
-console.time(`Marked accuracy run id - ${envAccuracyRunId} as ${status} in`);
+console.time(`Marked accuracy run id - ${envAccuracyRunId} as ${envAccuracyRunStatus} in`);
 const storage = await getAccuracySnapshotStorage();
 await storage.updateAccuracyRunStatus(envAccuracyRunId, envAccuracyRunStatus);
 await storage.close();
-console.timeEnd(`Marked accuracy run id - ${envAccuracyRunId} as ${status} in`);
+console.timeEnd(`Marked accuracy run id - ${envAccuracyRunId} as ${envAccuracyRunStatus} in`);
@@ -1,28 +1,16 @@
-import { describeAccuracyTests, describeSuite } from "./sdk/describe-accuracy-tests.js";
+import { describeAccuracyTests } from "./sdk/describe-accuracy-tests.js";
 import { getAvailableModels } from "./sdk/models.js";
-import { AccuracyTestConfig } from "./sdk/describe-accuracy-tests.js";
 
-function callsAggregate(prompt: string, pipeline: Record<string, unknown>[]): AccuracyTestConfig {
-    return {
-        injectConnectedAssumption: true,
-        prompt: prompt,
-        mockedTools: {},
+describeAccuracyTests(getAvailableModels(), [
+    {
+        prompt: "Group all the movies in 'mflix.movies' namespace by 'release_year' and give me a count of them",
         expectedToolCalls: [
             {
                 toolName: "aggregate",
                 parameters: {
-                    pipeline: pipeline,
+                    pipeline: [{ $group: { _id: "$release_year", count: { $sum: 1 } } }],
                 },
             },
         ],
-    };
-}
-
-describeAccuracyTests(getAvailableModels(), {
-    ...describeSuite("should call 'aggregate' tool", [
-        callsAggregate(
-            "Group all the movies in 'mflix.movies' namespace by 'release_year' and give me a count of them",
-            [{ $group: { _id: "$release_year", count: { $sum: 1 } } }]
-        ),
-    ]),
-});
+    },
+]);
@@ -1,12 +1,10 @@
-import { describeAccuracyTests, describeSuite } from "./sdk/describe-accuracy-tests.js";
+import { describeAccuracyTests } from "./sdk/describe-accuracy-tests.js";
 import { getAvailableModels } from "./sdk/models.js";
 import { AccuracyTestConfig } from "./sdk/describe-accuracy-tests.js";
 
 function callsCollectionIndexes(prompt: string): AccuracyTestConfig {
     return {
-        injectConnectedAssumption: true,
         prompt: prompt,
-        mockedTools: {},
         expectedToolCalls: [
             {
                 toolName: "collection-indexes",
@@ -19,12 +17,10 @@ function callsCollectionIndexes(prompt: string): AccuracyTestConfig {
     };
 }
 
-describeAccuracyTests(getAvailableModels(), {
-    ...describeSuite("should call 'collection-indexes' tool", [
-        callsCollectionIndexes("How many indexes do I have in 'mflix.movies' namespace?"),
-        callsCollectionIndexes("List all the indexes in movies collection in mflix database"),
-        callsCollectionIndexes(
-            `Is the following query: ${JSON.stringify({ runtime: { $lt: 100 } })} on the namespace 'mflix.movies' indexed?`
-        ),
-    ]),
-});
+describeAccuracyTests(getAvailableModels(), [
+    callsCollectionIndexes("How many indexes do I have in 'mflix.movies' namespace?"),
+    callsCollectionIndexes("List all the indexes in movies collection in mflix database"),
+    callsCollectionIndexes(
+        `Is the following query: ${JSON.stringify({ runtime: { $lt: 100 } })} on the namespace 'mflix.movies' indexed?`
+    ),
+]);
@@ -1,12 +1,10 @@
-import { describeAccuracyTests, describeSuite } from "./sdk/describe-accuracy-tests.js";
+import { describeAccuracyTests } from "./sdk/describe-accuracy-tests.js";
 import { getAvailableModels } from "./sdk/models.js";
 import { AccuracyTestConfig } from "./sdk/describe-accuracy-tests.js";
 
 function callsCollectionSchema(prompt: string): AccuracyTestConfig {
     return {
-        injectConnectedAssumption: true,
         prompt: prompt,
-        mockedTools: {},
         expectedToolCalls: [
             {
                 toolName: "collection-schema",
@@ -19,9 +17,7 @@ function callsCollectionSchema(prompt: string): AccuracyTestConfig {
     };
 }
 
-describeAccuracyTests(getAvailableModels(), {
-    ...describeSuite("should call 'collection-schema' tool", [
-        callsCollectionSchema("Is there a title field in 'db1.coll1' namespace?"),
-        callsCollectionSchema("What is the type of value stored in title field in coll1 collection in db1 database?"),
-    ]),
-});
+describeAccuracyTests(getAvailableModels(), [
+    callsCollectionSchema("Is there a title field in 'db1.coll1' namespace?"),
+    callsCollectionSchema("What is the type of value stored in title field in coll1 collection in db1 database?"),
+]);
@@ -1,31 +1,22 @@
-import { describeAccuracyTests, describeSuite } from "./sdk/describe-accuracy-tests.js";
+import { describeAccuracyTests } from "./sdk/describe-accuracy-tests.js";
 import { getAvailableModels } from "./sdk/models.js";
-import { AccuracyTestConfig } from "./sdk/describe-accuracy-tests.js";
-import { ExpectedToolCall } from "./sdk/accuracy-snapshot-storage/snapshot-storage.js";
 
-function callsCollectionStorageSize(prompt: string, expectedToolCalls: ExpectedToolCall[]): AccuracyTestConfig {
-    return {
-        injectConnectedAssumption: true,
-        prompt: prompt,
-        mockedTools: {},
-        expectedToolCalls: expectedToolCalls,
-    };
-}
-
-describeAccuracyTests(getAvailableModels(), {
-    ...describeSuite("should only call 'collection-storage-size' tool", [
-        callsCollectionStorageSize("What is the size of 'mflix.movies' namespace", [
+describeAccuracyTests(getAvailableModels(), [
+    {
+        prompt: "What is the size of 'mflix.movies' namespace",
+        expectedToolCalls: [
             {
                 toolName: "collection-storage-size",
                 parameters: {
                     database: "mflix",
                     collection: "movies",
                 },
             },
-        ]),
-    ]),
-    ...describeSuite("should call 'collection-storage-size' tool after another tool/s", [
-        callsCollectionStorageSize("How much size is each collection in comics database", [
+        ],
+    },
+    {
+        prompt: "How much size is each collection in comics database",
+        expectedToolCalls: [
             {
                 toolName: "list-collections",
                 parameters: {
@@ -46,6 +37,6 @@ describeAccuracyTests(getAvailableModels(), {
                     collection: "characters",
                 },
             },
-        ]),
-    ]),
-});
+        ],
+    },
+]);
@@ -1,12 +1,10 @@
-import { describeAccuracyTests, describeSuite } from "./sdk/describe-accuracy-tests.js";
+import { describeAccuracyTests } from "./sdk/describe-accuracy-tests.js";
 import { getAvailableModels } from "./sdk/models.js";
 import { AccuracyTestConfig } from "./sdk/describe-accuracy-tests.js";
 
 function callsCountToolWithEmptyQuery(prompt: string, database = "mflix", collection = "movies"): AccuracyTestConfig {
     return {
-        injectConnectedAssumption: true,
         prompt: prompt,
-        mockedTools: {},
         expectedToolCalls: [
             {
                 toolName: "count",
@@ -26,9 +24,7 @@ function callsCountToolWithQuery(
     query: Record<string, unknown> = {}
 ): AccuracyTestConfig {
     return {
-        injectConnectedAssumption: true,
         prompt: prompt,
-        mockedTools: {},
         expectedToolCalls: [
             {
                 toolName: "count",
@@ -42,19 +38,17 @@ function callsCountToolWithQuery(
     };
 }
 
-describeAccuracyTests(getAvailableModels(), {
-    ...describeSuite("should only call 'count' tool", [
-        callsCountToolWithEmptyQuery("Count number of documents in 'mflix.movies' namespace."),
-        callsCountToolWithEmptyQuery(
-            "How many documents are there in 'characters' collection in 'comics' database?",
-            "comics",
-            "characters"
-        ),
-        callsCountToolWithQuery(
-            "Count all the documents in 'mflix.movies' namespace with runtime less than 100?",
-            "mflix",
-            "movies",
-            { runtime: { $lt: 100 } }
-        ),
-    ]),
-});
+describeAccuracyTests(getAvailableModels(), [
+    callsCountToolWithEmptyQuery("Count number of documents in 'mflix.movies' namespace."),
+    callsCountToolWithEmptyQuery(
+        "How many documents are there in 'characters' collection in 'comics' database?",
+        "comics",
+        "characters"
+    ),
+    callsCountToolWithQuery(
+        "Count all the documents in 'mflix.movies' namespace with runtime less than 100?",
+        "mflix",
+        "movies",
+        { runtime: { $lt: 100 } }
+    ),
+]);
@@ -1,13 +1,11 @@
-import { describeAccuracyTests, describeSuite } from "./sdk/describe-accuracy-tests.js";
+import { describeAccuracyTests } from "./sdk/describe-accuracy-tests.js";
 import { getAvailableModels } from "./sdk/models.js";
 import { AccuracyTestConfig } from "./sdk/describe-accuracy-tests.js";
 import { ExpectedToolCall } from "./sdk/accuracy-snapshot-storage/snapshot-storage.js";
 
 function callsCreateCollection(prompt: string, database: string, collection: string): AccuracyTestConfig {
     return {
-        injectConnectedAssumption: true,
         prompt: prompt,
-        mockedTools: {},
         expectedToolCalls: [
             {
                 toolName: "create-collection",
@@ -29,29 +27,25 @@ function callsCreateCollectionWithListCollections(prompt: string, expectedToolCa
     };
 }
 
-describeAccuracyTests(getAvailableModels(), {
-    ...describeSuite("should only call 'create-collection' tool", [
-        callsCreateCollection("Create a new namespace 'mflix.documentaries'", "mflix", "documentaries"),
-        callsCreateCollection("Create a new collection villains in comics database", "comics", "villains"),
-    ]),
-    ...describeSuite("should call 'create-collection' alongside other required tools", [
-        callsCreateCollectionWithListCollections(
-            "If and only if, the namespace 'mflix.documentaries' does not exist, then create it",
-            [
-                {
-                    toolName: "list-collections",
-                    parameters: {
-                        database: "mflix",
-                    },
+describeAccuracyTests(getAvailableModels(), [
+    callsCreateCollection("Create a new namespace 'mflix.documentaries'", "mflix", "documentaries"),
+    callsCreateCollection("Create a new collection villains in comics database", "comics", "villains"),
+    callsCreateCollectionWithListCollections(
+        "If and only if, the namespace 'mflix.documentaries' does not exist, then create it",
+        [
+            {
+                toolName: "list-collections",
+                parameters: {
+                    database: "mflix",
                 },
-                {
-                    toolName: "create-collection",
-                    parameters: {
-                        database: "mflix",
-                        collection: "documentaries",
-                    },
+            },
+            {
+                toolName: "create-collection",
+                parameters: {
+                    database: "mflix",
+                    collection: "documentaries",
                 },
-            ]
-        ),
-    ]),
-});
+            },
+        ]
+    ),
+]);
@@ -1,12 +1,10 @@
-import { describeAccuracyTests, describeSuite } from "./sdk/describe-accuracy-tests.js";
+import { describeAccuracyTests } from "./sdk/describe-accuracy-tests.js";
 import { getAvailableModels } from "./sdk/models.js";
 import { AccuracyTestConfig } from "./sdk/describe-accuracy-tests.js";
 
 function callsCreateIndex(prompt: string, indexKeys: Record<string, unknown>): AccuracyTestConfig {
     return {
-        injectConnectedAssumption: true,
         prompt: prompt,
-        mockedTools: {},
         expectedToolCalls: [
             {
                 toolName: "create-index",
@@ -20,16 +18,14 @@ function callsCreateIndex(prompt: string, indexKeys: Record<string, unknown>): A
     };
 }
 
-describeAccuracyTests(getAvailableModels(), {
-    ...describeSuite("should call 'create-index' tool", [
-        callsCreateIndex(
-            "Create an index that covers the following query on 'mflix.movies' namespace - { \"release_year\": 1992 }",
-            {
-                release_year: 1,
-            }
-        ),
-        callsCreateIndex("Create a text index on title field in 'mflix.movies' namespace", {
-            title: "text",
-        }),
-    ]),
-});
+describeAccuracyTests(getAvailableModels(), [
+    callsCreateIndex(
+        "Create an index that covers the following query on 'mflix.movies' namespace - { \"release_year\": 1992 }",
+        {
+            release_year: 1,
+        }
+    ),
+    callsCreateIndex("Create a text index on title field in 'mflix.movies' namespace", {
+        title: "text",
+    }),
+]);
@@ -1,12 +1,10 @@
-import { describeAccuracyTests, describeSuite } from "./sdk/describe-accuracy-tests.js";
+import { describeAccuracyTests } from "./sdk/describe-accuracy-tests.js";
 import { getAvailableModels } from "./sdk/models.js";
 import { AccuracyTestConfig } from "./sdk/describe-accuracy-tests.js";
 
 function callsListDatabases(prompt: string, database = "mflix"): AccuracyTestConfig {
     return {
-        injectConnectedAssumption: true,
         prompt: prompt,
-        mockedTools: {},
         expectedToolCalls: [
             {
                 toolName: "db-stats",
@@ -18,8 +16,4 @@ function callsListDatabases(prompt: string, database = "mflix"): AccuracyTestCon
     };
 }
 
-describeAccuracyTests(getAvailableModels(), {
-    ...describeSuite("should only call 'db-stats' tool", [
-        callsListDatabases("What is the size occupied by database mflix?"),
-    ]),
-});
+describeAccuracyTests(getAvailableModels(), [callsListDatabases("What is the size occupied by database mflix?")]);