---
title: DeepSeek R1 with function calling
date: 2025-02-20T22:00:00Z
lastUpdated: false
author:
    name: Gilad S.
    github: giladgd
category: Release
description: node-llama-cpp v3.6 is here, with full support for DeepSeek R1, including function calling!
image:
    url: https://github.com/user-attachments/assets/9ed954f8-102d-4cdd-96d8-9b6710b8a1f5
    alt: "node-llama-cpp + DeepSeek R1"
    width: 3072
    height: 1536
---
[`node-llama-cpp`](https://node-llama-cpp.withcat.ai) v3.6 is here, with full support for [DeepSeek R1](https://github.com/deepseek-ai/DeepSeek-R1), including function calling!

---

## Function Calling
`node-llama-cpp` uses [many tricks](../guide/function-calling) to make function calling work with most models.
This release includes special adaptations for DeepSeek R1 to improve function calling performance and stability.

Here's a basic example of function calling with DeepSeek R1:
```typescript
import {fileURLToPath} from "url";
import path from "path";
import {
    getLlama, LlamaChatSession, defineChatSessionFunction, resolveModelFile
} from "node-llama-cpp";

const __dirname = path.dirname(fileURLToPath(import.meta.url));
const modelsDir = path.join(__dirname, "..", "models");

const modelUri = "hf:mradermacher/DeepSeek-R1-Distill-Qwen-7B-GGUF:Q4_K_M";

// download the model file if it isn't already in `modelsDir`, then load it
const llama = await getLlama();
const model = await llama.loadModel({
    modelPath: await resolveModelFile(modelUri, modelsDir)
});
const context = await model.createContext();
const session = new LlamaChatSession({
    contextSequence: context.getSequence()
});

const fruitPrices: Record<string, string> = {
    "apple": "$6",
    "banana": "$4"
};

// functions the model can call while answering the prompt
const functions = {
    getFruitPrice: defineChatSessionFunction({
        description: "Get the price of a fruit",
        params: {
            type: "object",
            properties: {
                name: {
                    type: "string"
                }
            }
        },
        async handler(params) {
            const name = params.name.toLowerCase();
            if (Object.keys(fruitPrices).includes(name))
                return {
                    name: name,
                    price: fruitPrices[name]
                };

            return `Unrecognized fruit "${params.name}"`;
        }
    })
};

const q1 = "Is an apple more expensive than a banana?";
console.log("User: " + q1);

const a1 = await session.prompt(q1, {functions});
console.log("AI: " + a1.trim());
```


## Recommended Models
Here are some recommended model URIs you can use to try out DeepSeek R1 with function calling.

| Model                                                                                                 | Size   | URI                                                        |
|-------------------------------------------------------------------------------------------------------|--------|------------------------------------------------------------|
| [DeepSeek R1 Distill Qwen 7B](https://huggingface.co/mradermacher/DeepSeek-R1-Distill-Qwen-7B-GGUF)    | 4.68GB | `hf:mradermacher/DeepSeek-R1-Distill-Qwen-7B-GGUF:Q4_K_M`  |
| [DeepSeek R1 Distill Qwen 14B](https://huggingface.co/mradermacher/DeepSeek-R1-Distill-Qwen-14B-GGUF)  | 8.99GB | `hf:mradermacher/DeepSeek-R1-Distill-Qwen-14B-GGUF:Q4_K_M` |
| [DeepSeek R1 Distill Qwen 32B](https://huggingface.co/mradermacher/DeepSeek-R1-Distill-Qwen-32B-GGUF)  | 23.3GB | `hf:mradermacher/DeepSeek-R1-Distill-Qwen-32B-GGUF:Q4_K_M` |

::: info TIP
Before downloading a model, you can estimate its compatibility with your machine using the [`inspect estimate`](../cli/inspect/estimate.md) command:
```shell
npx -y node-llama-cpp inspect estimate <model URI>
```
:::

### Try It Using the CLI
To try out function calling with a given model using the CLI, you can use the [`chat` command](../cli/chat.md) with the `--ef` flag
to provide the model with date and time functions:

```shell
npx -y node-llama-cpp chat --ef --prompt "What is the time?" <model URI>
```


## Chain of Thought Segmentation
The thoughts generated by a reasoning model are now [separated into `thought` segments](../guide/chat-session.md#stream-response-segments) in the response,
so you can choose whether to use them or not.

By default, the [`.prompt(...)`](../api/classes/LlamaChatSession#prompt) method returns only the main response, without any `thought` segments.
Use the [`.promptWithMeta(...)`](../api/classes/LlamaChatSession#promptwithmeta) method to get the full response.

You can use the new [`onResponseChunk`](../api/type-aliases/LLamaChatPromptOptions.md#onresponsechunk) option to [stream `thought` segments as they are being generated](../guide/chat-session.md#stream-response-segments).

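
For example, here's a minimal sketch of streaming `thought` segments, reusing the `session` and `functions` from the example above. It assumes the `chunk` object passed to `onResponseChunk` exposes the `type`, `segmentType`, and `text` fields described in the linked guide; check the API docs for the exact shape:
```typescript
const q2 = "Is a banana cheaper than an apple?";
console.log("User: " + q2);

process.stdout.write("AI: ");
const a2 = await session.prompt(q2, {
    functions,
    onResponseChunk(chunk) {
        // `thought` segments arrive with `type: "segment"` and
        // `segmentType: "thought"`; main response chunks have no `type`
        const isThought = chunk.type === "segment" &&
            chunk.segmentType === "thought";

        if (isThought)
            process.stdout.write(`\x1b[2m${chunk.text}\x1b[0m`); // print thoughts dimmed
        else
            process.stdout.write(chunk.text);
    }
});
console.log();

// `a2` contains only the main response, without the `thought` segments
console.log("Answer: " + a2.trim());
```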

## Electron App Template
The [Electron app template](../guide/electron.md) has been updated to properly segment the thoughts in the response.

Try it out by downloading the latest build [from GitHub](https://github.com/withcatai/node-llama-cpp/releases/latest),
or by [scaffolding a new project](../guide/index.md#scaffold-new-project) based on the Electron template:

```shell
npm create node-llama-cpp@latest
```

<YouTubePlayer id="IqfMs0lfIvQ" />