botpress
diff --git a/‎.github/workflows/vai.yml‎
Lines changed: 40 additions & 0 deletions b/‎.github/workflows/vai.yml‎
Lines changed: 40 additions & 0 deletions
diff --git a/‎.github/workflows/wasm.yml‎
Lines changed: 37 additions & 0 deletions b/‎.github/workflows/wasm.yml‎
Lines changed: 37 additions & 0 deletions
diff --git a/‎.github/workflows/zai.yml‎
Lines changed: 40 additions & 0 deletions b/‎.github/workflows/zai.yml‎
Lines changed: 40 additions & 0 deletions
diff --git a/‎.vscode/settings.json‎
Lines changed: 3 additions & 0 deletions b/‎.vscode/settings.json‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎vai/.npmignore‎
Lines changed: 7 additions & 0 deletions b/‎vai/.npmignore‎
Lines changed: 7 additions & 0 deletions
diff --git a/‎vai/README.md‎
Lines changed: 163 additions & 0 deletions b/‎vai/README.md‎
Lines changed: 163 additions & 0 deletions
diff --git a/‎vai/ensure-env.cjs‎
Lines changed: 9 additions & 0 deletions b/‎vai/ensure-env.cjs‎
Lines changed: 9 additions & 0 deletions
diff --git a/‎vai/package.json‎
Lines changed: 46 additions & 0 deletions b/‎vai/package.json‎
Lines changed: 46 additions & 0 deletions
@@ -0,0 +1,40 @@
+name: vai  # CI for the vai package: install, build, test, then publish
+
+on:
+  push:
+    branches:
+      - master
+    paths:
+      - 'vai/**'  # only pushes that touch files under vai/
+
+  pull_request:
+    paths:
+      - 'vai/**'  # only pull requests that touch files under vai/
+
+  workflow_dispatch: {}  # manual trigger; no inputs are declared
+
+defaults:
+  run:
+    working-directory: ./vai  # applies to `run:` steps only, so Publish passes its own path
+
+jobs:
+  vai:
+    runs-on: ubuntu-latest
+    timeout-minutes: 15
+    steps:
+      - uses: actions/checkout@v4
+      - uses: pnpm/action-setup@v3.0.0
+        with:
+          version: 8.6.2  # pnpm version to install
+      - run: pnpm install --frozen-lockfile
+      - run: pnpm build
+      - run: pnpm test
+        env:  # secrets are exposed to the test step only
+          CLOUD_BOT_ID: ${{ secrets.CLOUD_BOT_ID }}
+          CLOUD_PAT: ${{ secrets.CLOUD_PAT }}
+      - name: Publish  # skipped on pull requests; NOTE(review): a manual run from any ref also publishes - confirm intended
+        if: github.ref == 'refs/heads/master' || github.event_name == 'workflow_dispatch'
+        uses: botpress/gh-actions/publish-if-not-exists@master
+        with:
+          path: './vai'
+          token: '${{ secrets.NPM_ACCESS_TOKEN }}'
@@ -0,0 +1,37 @@
+name: wasm  # CI for the wasm package: install, build, test, then publish
+
+on:
+  push:
+    branches:
+      - master
+    paths:
+      - 'wasm/**'  # only pushes that touch files under wasm/
+
+  pull_request:
+    paths:
+      - 'wasm/**'  # only pull requests that touch files under wasm/
+
+  workflow_dispatch: {}  # manual trigger; no inputs are declared
+
+defaults:
+  run:
+    working-directory: ./wasm  # applies to `run:` steps only, so Publish passes its own path
+
+jobs:
+  wasm:
+    runs-on: ubuntu-latest
+    timeout-minutes: 15
+    steps:
+      - uses: actions/checkout@v4
+      - uses: pnpm/action-setup@v3.0.0
+        with:
+          version: 8.6.2  # pnpm version to install
+      - run: pnpm install --frozen-lockfile
+      - run: pnpm build
+      - run: pnpm test  # no secrets are passed to this step
+      - name: Publish  # skipped on pull requests; NOTE(review): a manual run from any ref also publishes - confirm intended
+        if: github.ref == 'refs/heads/master' || github.event_name == 'workflow_dispatch'
+        uses: botpress/gh-actions/publish-if-not-exists@master
+        with:
+          path: './wasm'
+          token: '${{ secrets.NPM_ACCESS_TOKEN }}'
@@ -0,0 +1,40 @@
+name: zai  # CI for the zai package: install, build, test, then publish
+
+on:
+  push:
+    branches:
+      - master
+    paths:
+      - 'zai/**'  # only pushes that touch files under zai/
+
+  pull_request:
+    paths:
+      - 'zai/**'  # only pull requests that touch files under zai/
+
+  workflow_dispatch: {}  # manual trigger; no inputs are declared
+
+defaults:
+  run:
+    working-directory: ./zai  # applies to `run:` steps only, so Publish passes its own path
+
+jobs:
+  zai:
+    runs-on: ubuntu-latest
+    timeout-minutes: 15
+    steps:
+      - uses: actions/checkout@v4
+      - uses: pnpm/action-setup@v3.0.0
+        with:
+          version: 8.6.2  # pnpm version to install
+      - run: pnpm install --frozen-lockfile
+      - run: pnpm build
+      - run: pnpm test
+        env:  # secrets are exposed to the test step only
+          CLOUD_BOT_ID: ${{ secrets.CLOUD_BOT_ID }}
+          CLOUD_PAT: ${{ secrets.CLOUD_PAT }}
+      - name: Publish  # skipped on pull requests; NOTE(review): a manual run from any ref also publishes - confirm intended
+        if: github.ref == 'refs/heads/master' || github.event_name == 'workflow_dispatch'
+        uses: botpress/gh-actions/publish-if-not-exists@master
+        with:
+          path: './zai'
+          token: '${{ secrets.NPM_ACCESS_TOKEN }}'
@@ -0,0 +1,3 @@
+{
+  "vitest.disableWorkspaceWarning": true
+}
@@ -0,0 +1,7 @@
+src/
+node_modules/
+*.test.ts
+*.test.js
+.env
+.env.local
+.turbo
@@ -0,0 +1,163 @@
+# Vitest AI
+
+**Vai** (stands for _Vitest + AI_) is a lightweight vitest extension that uses LLMs to do assertions.
+The goal of this library is primarily to allow testing the output of LLMs, such as the new autonomous engine: because that output is dynamic and qualitative, we can't rely on traditional hard-coded tests.
+
+To remove the flakiness and human input from these tests, we need LLMs.
+
+It's built on top of Zui and the Botpress client to interface with the different LLMs.
+
+## Usage
+
+```typescript
+import { check, rate, filter, extract } from '@botpress/vai'
+import { describe, test } from 'vitest'
+
+describe('my test suite', () => {
+  test('example', () => {
+    check('botpress', 'is a chatbot company').toBe(true)
+  })
+})
+```
+
+## `check (assertion)`
+
+Checks that the provided value matches the provided condition
+
+```typescript
+test('example', () => {
+  // works with strings
+  check('hello', 'is a greeting message').toBe(true)
+
+  // also works with objects, arrays etc..
+  check(
+    {
+      message: 'hello my friend',
+      from: 'user'
+    },
+    'is a greeting message'
+  ).toBe(true)
+})
+```
+
+## `extract (assertion)`
+
+Extracts the requested Zui schema from any input:
+
+```typescript
+const person = z.object({
+  name: z.string(),
+  age: z.number().optional(),
+  country: z.string().optional()
+})
+
+extract('My name is Sylvain, I am 33 yo and live in Canada', person).toMatchObject({
+  name: 'Sylvain',
+  age: 33,
+  country: 'Canada'
+})
+```
+
+`toMatchInlineSnapshot` is also supported:
+
+```typescript
+test('toMatchInlineSnapshot', () => {
+  extract('My name is Eric!', z.object({ name: z.string() })).toMatchInlineSnapshot(`
+    {
+      "name": "Eric",
+    }
+  `)
+})
+```
+
+## `filter (assertion)`
+
+Filters an array of anything `T[]` based on a provided condition:
+
+```typescript
+const countries = ['canada', 'germany', 'usa', 'paris', 'mexico']
+filter(countries, 'is in north america').toBe(['canada', 'usa', 'mexico'])
+filter(countries, 'is the name of a country').length.toBe(4)
+```
+
+## `rate (assertion)`
+
+Given any input `T`, gives a rating between `1` (worst) and `5` (best):
+
+```typescript
+test('good', () => rate('gandhi', 'is a good person').toBeGreaterThanOrEqual(4))
+test('evil', () => rate('hitler', 'is a good person').toBe(1))
+```
+
+## Few-shot Examples
+
+All assertion methods accept examples to provide the LLM with few-shot learning and help increase the accuracy.
+
+```typescript
+describe('learns from examples', () => {
+  test('examples are used to understand how to classify correctly', () => {
+    const examples = [
+      {
+        expected: true,
+        value: 'Rasa the chatbot framework',
+        reason: 'Rasa is a chatbot framework, so it competes with Botpress'
+      },
+      {
+        expected: false,
+        value: 'Rasa the coffee company',
+        reason: 'Since Rasa is a coffee company, it does not compete with Botpress which is not in the coffee business'
+      }
+    ]
+
+    check('Voiceflow', 'is competitor', { examples }).toBe(true)
+    check('Toyota', 'is competitor', { examples }).toBe(false)
+  })
+})
+```
+
+## Failure Messages
+
+All model predictions have nice failure messages by default:
+
+```typescript
+const countries = ['canada', 'germany', 'usa', 'paris', 'mexico']
+filter(countries, 'is in north america').toBe(['canada', 'usa'])
+```
+
+## Promises
+
+All assertion methods can also be used outside Vitest tests, as they return a `PromiseLike<T>` object that can be awaited.
+
+```typescript
+test('test truth', async () => {
+  const { result } = await check('hello', 'is a greeting message')
+  expect(result).toBe(true)
+})
+```
+
+## Bail on failure
+
+You can await the assertion to bail immediately on failure and prevent other test cases from running:
+
+```typescript
+test('no bail', () => {
+  check('hello', 'is a greeting message').toBe(false)
+  console.log('this will run as the above is not awaited, it will bail at the end of the test')
+})
+
+test('bail', async () => {
+  await check('hello', 'is a greeting message').toBe(false)
+  console.log('this will not run, the test has bailed')
+})
+```
+
+## Changing the evaluator model
+
+By default, GPT-4o mini is used to evaluate the tests, but the evaluator can be changed from inside a test:
+
+```typescript
+test('simple', () => {
+  setEvaluator('anthropic__claude-3-5-sonnet-20240620')
+  rate('hello', 'is a greeting message').toBe(5)
+})
+```
@@ -0,0 +1,9 @@
+;(function () { // runs immediately on load; throws if a required env var is unset or empty
+  if (!process.env.CLOUD_BOT_ID) {
+    throw new Error('Env: CLOUD_BOT_ID is required')
+  }
+
+  if (!process.env.CLOUD_PAT) {
+    throw new Error('Env: CLOUD_PAT is required')
+  }
+})()
@@ -0,0 +1,46 @@
+{
+  "name": "@botpress/vai",
+  "version": "0.0.5",
+  "description": "Vitest AI (vai) – a vitest extension for testing with LLMs",
+  "exports": {
+    ".": {
+      "types": "./dist/index.d.ts",
+      "import": "./dist/index.js",
+      "require": "./dist/index.js"
+    }
+  },
+  "scripts": {
+    "build": "npm run build:types && npm run build:neutral",
+    "build:neutral": "esbuild src/**/*.ts src/*.ts --platform=neutral --outdir=dist",
+    "build:types": "tsup",
+    "watch": "tsup --watch",
+    "test": "vitest run --config vitest.config.ts",
+    "test:update": "vitest -u run --config vitest.config.ts",
+    "test:watch": "vitest --config vitest.config.ts",
+    "build-with-latest-models": "pnpm run update-types && pnpm run update-models && pnpm run build",
+    "update-models": "ts-node ./src/scripts/update-models.ts",
+    "update-types": "ts-node ./src/scripts/update-types.ts"
+  },
+  "keywords": [],
+  "author": "",
+  "license": "ISC",
+  "dependencies": {
+    "json5": "^2.2.1",
+    "jsonrepair": "^3.2.0"
+  },
+  "devDependencies": {
+    "@types/lodash": "^4.17.0",
+    "dotenv": "^16.3.1",
+    "esbuild": "^0.24.2",
+    "ts-node": "^10.9.2",
+    "tsup": "^8.3.5",
+    "typescript": "^5.7.2"
+  },
+  "peerDependencies": {
+    "@botpress/client": "^0.40.0",
+    "@botpress/wasm": "^1.0.1",
+    "@bpinternal/zui": "^0.13.4",
+    "lodash": "^4.17.21",
+    "vitest": "^2 || ^3 || ^4 || ^5"
+  }
+}
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+{`
	`2`	`+ "vitest.disableWorkspaceWarning": true`
	`3`	`+}`