SciSharp
diff --git a/.github/workflows/compile.yml b/.github/workflows/compile.yml
Lines changed: 14 additions & 14 deletions
diff --git a/.github/workflows/stale_issues.yml b/.github/workflows/stale_issues.yml
Lines changed: 20 additions & 0 deletions
diff --git a/LLama.Examples/Examples/KernelMemory.cs b/LLama.Examples/Examples/KernelMemory.cs
Lines changed: 1 addition & 1 deletion
diff --git a/LLama.Examples/Examples/KernelMemorySaveAndLoad.cs b/LLama.Examples/Examples/KernelMemorySaveAndLoad.cs
Lines changed: 1 addition & 1 deletion
diff --git a/LLama.Examples/LLama.Examples.csproj b/LLama.Examples/LLama.Examples.csproj
Lines changed: 6 additions & 6 deletions
diff --git a/LLama.KernelMemory/LLamaSharpTextEmbeddingGenerator.cs b/LLama.KernelMemory/LLamaSharpTextEmbeddingGenerator.cs
Lines changed: 10 additions & 8 deletions
diff --git a/LLama.KernelMemory/LlamaSharpTextGenerator.cs b/LLama.KernelMemory/LlamaSharpTextGenerator.cs
Lines changed: 4 additions & 2 deletions
diff --git a/LLama.SemanticKernel/LLamaSharp.SemanticKernel.csproj b/LLama.SemanticKernel/LLamaSharp.SemanticKernel.csproj
Lines changed: 1 addition & 1 deletion
diff --git a/LLama.Unittest/Constants.cs b/LLama.Unittest/Constants.cs
Lines changed: 2 additions & 2 deletions
diff --git a/LLama.Unittest/KernelMemory/ITextTokenizerTests.cs b/LLama.Unittest/KernelMemory/ITextTokenizerTests.cs
Lines changed: 1 addition & 1 deletion
@@ -17,7 +17,7 @@ concurrency:
 
 env:
   # Compiler defines common to all platforms
-  COMMON_DEFINE: -DGGML_NATIVE=OFF -DLLAMA_BUILD_TESTS=OFF -DLLAMA_BUILD_EXAMPLES=ON -DLLAMA_BUILD_SERVER=OFF -DBUILD_SHARED_LIBS=ON
+  COMMON_DEFINE: -DGGML_NATIVE=OFF -DLLAMA_BUILD_TESTS=OFF -DLLAMA_BUILD_EXAMPLES=ON -DLLAMA_BUILD_SERVER=OFF -DBUILD_SHARED_LIBS=ON -DLLAMA_CURL=OFF
 
 jobs:
   compile-linux:
@@ -28,23 +28,23 @@ jobs:
         include:
           - build: 'noavx'
             defines: '-DGGML_AVX=OFF -DGGML_AVX2=OFF -DGGML_FMA=OFF'
-            os: ubuntu-20.04
+            os: ubuntu-24.04
             arch: x64
           - build: 'avx2'
             defines: ''
-            os: ubuntu-20.04
+            os: ubuntu-24.04
             arch: x64
           - build: 'avx'
             defines: '-DGGML_AVX2=OFF'
-            os: ubuntu-20.04
+            os: ubuntu-24.04
             arch: x64
           - build: 'avx512'
             defines: '-DGGML_AVX512=ON'
-            os: ubuntu-20.04
+            os: ubuntu-24.04
             arch: x64
           - build: 'aarch64'
             defines: '-DGGML_NATIVE=OFF -DGGML_CPU_AARCH64=ON -DGGML_CPU_ARM_ARCH=armv8-a'
-            os: ubuntu-22.04-arm
+            os: ubuntu-24.04-arm
             arch: arm64
     runs-on: ${{ matrix.os }}
     steps:
@@ -102,7 +102,7 @@ jobs:
             defines: '-DGGML_AVX2=OFF'
           - build: 'avx512'
             defines: '-DGGML_AVX512=ON'
-    runs-on: ubuntu-20.04
+    runs-on: ubuntu-24.04
     container:
       image: alpine:latest
     steps:
@@ -346,7 +346,7 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        os: [ubuntu-20.04, windows-2019]
+        os: [ubuntu-22.04, windows-2019]
         cuda: ['12.2.0', '11.7.1']
     runs-on: ${{ matrix.os }}
     steps:
@@ -421,35 +421,35 @@ jobs:
           if-no-files-found: error
 
       - name: Upload artifacts (Linux)
-        if: ${{ matrix.os == 'ubuntu-20.04' }}
+        if: ${{ matrix.os == 'ubuntu-22.04' }}
         uses: actions/upload-artifact@v4
         with:
           path: ./build/bin/libllama.so
           name: llama-bin-linux-cublas-cu${{ matrix.cuda }}-x64.so
           if-no-files-found: error
       - name: Upload artifacts ggml (Linux)
-        if: ${{ matrix.os == 'ubuntu-20.04' }}
+        if: ${{ matrix.os == 'ubuntu-22.04' }}
         uses: actions/upload-artifact@v4
         with:
           path: ./build/bin/libggml.so
           name: ggml-bin-linux-cublas-cu${{ matrix.cuda }}-x64.so
           if-no-files-found: error
       - name: Upload artifacts ggml-base (Linux)
-        if: ${{ matrix.os == 'ubuntu-20.04' }}
+        if: ${{ matrix.os == 'ubuntu-22.04' }}
         uses: actions/upload-artifact@v4
         with:
           path: ./build/bin/libggml-base.so
           name: ggml-base-bin-linux-cublas-cu${{ matrix.cuda }}-x64.so
           if-no-files-found: error
       - name: Upload artifacts ggml-cuda (Linux)
-        if: ${{ matrix.os == 'ubuntu-20.04' }}
+        if: ${{ matrix.os == 'ubuntu-22.04' }}
         uses: actions/upload-artifact@v4
         with:
           path: ./build/bin/libggml-cuda.so
           name: ggml-cuda-bin-linux-cublas-cu${{ matrix.cuda }}-x64.so
           if-no-files-found: error
       - name: Upload llava artifacts (Linux)
-        if: ${{ matrix.os == 'ubuntu-20.04' }}
+        if: ${{ matrix.os == 'ubuntu-22.04' }}
         uses: actions/upload-artifact@v4
         with:
           path: ./build/bin/libllava_shared.so
@@ -552,7 +552,7 @@ jobs:
             defines: '-DANDROID_ABI=x86_64'
           - build: 'arm64-v8a'
             defines: '-DANDROID_ABI=arm64-v8a'
-    runs-on: ubuntu-20.04
+    runs-on: ubuntu-24.04
     steps:
       - uses: actions/checkout@v4
         with:
 
@@ -0,0 +1,20 @@
+name: Close stale issues
+
+on:
+  schedule:
+    - cron: '0 0 * * *'
+
+jobs:
+  stale:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/stale@v9
+        with:
+          repo-token: ${{ secrets.GITHUB_TOKEN }}
+          stale-issue-message: 'This issue has been automatically marked as stale due to inactivity. If no further activity occurs, it will be closed in 7 days.'
+          stale-pr-message: 'This pull request has been automatically marked as stale due to inactivity. If no further activity occurs, it will be closed in 7 days.'
+          days-before-stale: 60
+          days-before-close: 7
+          stale-issue-label: 'stale'
+          exempt-issue-labels: 'do not close'
+          operations-per-run: 30
@@ -46,7 +46,7 @@ and answer questions about them in an interactive chat prompt.
 
             // Ask a predefined question
             Console.ForegroundColor = ConsoleColor.Green;
-            string question1 = "What formats does KM support";
+            string question1 = "What is Kernel Memory";
             Console.WriteLine($"Question: {question1}");
             await AnswerQuestion(memory, question1);
 
 
@@ -54,7 +54,7 @@ Press ENTER to proceed...
             await IngestDocuments(memory);
         }
 
-        await AskSingleQuestion(memory, "What formats does KM support?");
+        await AskSingleQuestion(memory, "What is Kernel Memory");
         await StartUserChatSession(memory);
     }
 
 
@@ -15,15 +15,15 @@
 
   <ItemGroup>
     <PackageReference Include="Microsoft.Extensions.Logging.Console" Version="9.0.3" />
-    <PackageReference Include="Microsoft.KernelMemory.Core" Version="0.97.250211.1" />
+    <PackageReference Include="Microsoft.KernelMemory.Core" Version="0.98.250323.1" />
     <PackageReference Include="Microsoft.SemanticKernel" Version="1.44.0" />
-    <PackageReference Include="Microsoft.SemanticKernel.Plugins.Memory" Version="1.6.2-alpha" />
+    <PackageReference Include="Microsoft.SemanticKernel.Plugins.Memory" Version="1.44.0-alpha" />
     <PackageReference Include="NAudio" Version="2.2.1" />
     <PackageReference Include="SixLabors.ImageSharp" Version="3.1.7" />
-    <PackageReference Include="Spectre.Console" Version="0.49.1" />
-    <PackageReference Include="Spectre.Console.ImageSharp" Version="0.49.1" />
-    <PackageReference Include="Whisper.net" Version="1.7.4" />
-    <PackageReference Include="Whisper.net.Runtime" Version="1.7.4" />
+    <PackageReference Include="Spectre.Console" Version="0.50.0" />
+    <PackageReference Include="Spectre.Console.ImageSharp" Version="0.50.0" />
+    <PackageReference Include="Whisper.net" Version="1.8.1" />
+    <PackageReference Include="Whisper.net.Runtime" Version="1.8.1" />
     <PackageReference Include="Whisper.net.Runtime.Clblast" Version="1.5.0" />
     <PackageReference Include="Whisper.net.Runtime.CoreML" Version="1.7.4" />
     <PackageReference Include="Whisper.net.Runtime.Cublas" Version="1.5.0" />
 
@@ -31,9 +31,11 @@ public LLamaSharpTextEmbeddingGenerator(LLamaSharpConfig config)
 
             var @params = new ModelParams(config.ModelPath)
             {
-                ContextSize = config.ContextSize,
-                GpuLayerCount = config.GpuLayerCount ?? 20,
-
+                ContextSize = config?.ContextSize ?? 2048,
+                GpuLayerCount = config?.GpuLayerCount ?? 20,
+                //Embeddings = true,
+                MainGpu = config?.MainGpu ?? 0,
+                SplitMode = config?.SplitMode ?? LLama.Native.GPUSplitMode.None,
                 PoolingType = LLamaPoolingType.Mean,
             };
 
@@ -54,11 +56,11 @@ public LLamaSharpTextEmbeddingGenerator(LLamaSharpConfig config, LLamaWeights we
 
             var @params = new ModelParams(config.ModelPath)
             {
-                ContextSize = config.ContextSize ?? 2048,
-                GpuLayerCount = config.GpuLayerCount ?? 20,
-                Embeddings = true,
-                MainGpu = config.MainGpu,
-                SplitMode = config.SplitMode,
+                ContextSize = config?.ContextSize ?? 2048,
+                GpuLayerCount = config?.GpuLayerCount ?? 20,
+                //Embeddings = true,
+                MainGpu = config?.MainGpu ?? 0,
+                SplitMode = config?.SplitMode ?? LLama.Native.GPUSplitMode.None,
                 PoolingType = LLamaPoolingType.Mean,
             };
             _weights = weights;
 
@@ -32,8 +32,10 @@ public LlamaSharpTextGenerator(LLamaSharpConfig config)
         {
             var parameters = new ModelParams(config.ModelPath)
             {
-                ContextSize = config.ContextSize ?? 2048,
-                GpuLayerCount = config.GpuLayerCount ?? 20,
+                ContextSize = config?.ContextSize ?? 2048,
+                GpuLayerCount = config?.GpuLayerCount ?? 20,
+                MainGpu = config?.MainGpu ?? 0,
+                SplitMode = config?.SplitMode ?? LLama.Native.GPUSplitMode.None,
             };
             _weights = LLamaWeights.LoadFromFile(parameters);
             _context = _weights.CreateContext(parameters);
 
@@ -34,7 +34,7 @@
 	</PropertyGroup>
 
 	<ItemGroup>
-		<PackageReference Include="Microsoft.SemanticKernel.Abstractions" Version="1.44.0" />
+		<PackageReference Include="Microsoft.SemanticKernel.Abstractions" Version="1.48.0" />
 	</ItemGroup>
 
 	<ItemGroup Condition="'$(TargetFramework)' == 'netstandard2.0'">
 
@@ -21,15 +21,15 @@ public static int CIGpuLayerCount
         {
             get
             {
-                if (RuntimeInformation.IsOSPlatform(OSPlatform.OSX))
+                //if (RuntimeInformation.IsOSPlatform(OSPlatform.OSX))
                 {
                     #if DEBUG
                       return 20;
                     #else
                       return 0;                      
                     #endif
                 }
-                else return 20;
+                //else return 20;
             }
         }
     }
 
@@ -22,7 +22,7 @@ public ITextTokenizerTests(ITestOutputHelper testOutputHelper)
             _testOutputHelper = testOutputHelper;
 
             _infParams = new() { AntiPrompts = ["\n\n"] };
-            _lsConfig = new(Constants.GenerativeModelPath) { DefaultInferenceParams = _infParams, ContextSize = 512 };
+            _lsConfig = new(Constants.GenerativeModelPath) { DefaultInferenceParams = _infParams, ContextSize = 512, SplitMode = LLama.Native.GPUSplitMode.Layer };
 
             testOutputHelper.WriteLine($"Using model {Path.GetFileName(_lsConfig.ModelPath)}");
         }
Original file line number	Diff line number	Diff line change
`@@ -54,7 +54,7 @@ Press ENTER to proceed...`
`54`	`54`	`await IngestDocuments(memory);`
`55`	`55`	`}`
`56`	`56`
`57`		`- await AskSingleQuestion(memory, "What formats does KM support?");`
	`57`	`+ await AskSingleQuestion(memory, "What is Kernel Memory");`
`58`	`58`	`await StartUserChatSession(memory);`
`59`	`59`	`}`
`60`	`60`
Original file line number	Diff line number	Diff line change
`@@ -32,8 +32,10 @@ public LlamaSharpTextGenerator(LLamaSharpConfig config)`
`32`	`32`	`{`
`33`	`33`	`var parameters = new ModelParams(config.ModelPath)`
`34`	`34`	`{`
`35`		`- ContextSize = config.ContextSize ?? 2048,`
`36`		`- GpuLayerCount = config.GpuLayerCount ?? 20,`
	`35`	`+ ContextSize = config?.ContextSize ?? 2048,`
	`36`	`+ GpuLayerCount = config?.GpuLayerCount ?? 20,`
	`37`	`+ MainGpu = config?.MainGpu ?? 0,`
	`38`	`+ SplitMode = config?.SplitMode ?? LLama.Native.GPUSplitMode.None,`
`37`	`39`	`};`
`38`	`40`	`_weights = LLamaWeights.LoadFromFile(parameters);`
`39`	`41`	`_context = _weights.CreateContext(parameters);`
Original file line number	Diff line number	Diff line change
`@@ -21,15 +21,15 @@ public static int CIGpuLayerCount`
`21`	`21`	`{`
`22`	`22`	`get`
`23`	`23`	`{`
`24`		`- if (RuntimeInformation.IsOSPlatform(OSPlatform.OSX))`
	`24`	`+ //if (RuntimeInformation.IsOSPlatform(OSPlatform.OSX))`
`25`	`25`	`{`
`26`	`26`	`#if DEBUG`
`27`	`27`	`return 20;`
`28`	`28`	`#else`
`29`	`29`	`return 0;`
`30`	`30`	`#endif`
`31`	`31`	`}`
`32`		`- else return 20;`
	`32`	`+ //else return 20;`
`33`	`33`	`}`
`34`	`34`	`}`
`35`	`35`	`}`
Original file line number	Diff line number	Diff line change
`@@ -22,7 +22,7 @@ public ITextTokenizerTests(ITestOutputHelper testOutputHelper)`
`22`	`22`	`_testOutputHelper = testOutputHelper;`
`23`	`23`
`24`	`24`	`_infParams = new() { AntiPrompts = ["\n\n"] };`
`25`		`- _lsConfig = new(Constants.GenerativeModelPath) { DefaultInferenceParams = _infParams, ContextSize = 512 };`
	`25`	`+ _lsConfig = new(Constants.GenerativeModelPath) { DefaultInferenceParams = _infParams, ContextSize = 512, SplitMode = LLama.Native.GPUSplitMode.Layer };`
`26`	`26`
`27`	`27`	`testOutputHelper.WriteLine($"Using model {Path.GetFileName(_lsConfig.ModelPath)}");`
`28`	`28`	`}`