
Commit bc4bdf9

sync fork
2 parents: 4421364 + 240f06c

30 files changed, +410 -173 lines

.github/workflows/compile.yml

Lines changed: 93 additions & 1 deletion
@@ -76,6 +76,72 @@ jobs:
           name: llava-bin-linux-${{ matrix.build }}-x64.so
           if-no-files-found: error
 
+  compile-musl:
+    name: Compile (musl)
+    strategy:
+      fail-fast: true
+      matrix:
+        include:
+          - build: 'noavx'
+            defines: '-DGGML_AVX=OFF -DGGML_AVX2=OFF -DGGML_FMA=OFF'
+          - build: 'avx2'
+            defines: ''
+          - build: 'avx'
+            defines: '-DGGML_AVX2=OFF'
+          - build: 'avx512'
+            defines: '-DGGML_AVX512=ON'
+    runs-on: ubuntu-20.04
+    container:
+      image: alpine:latest
+    steps:
+      - name: Install dependencies
+        run: |
+          apk update && apk add --no-cache \
+            build-base \
+            cmake \
+            git \
+            linux-headers \
+            g++
+      - uses: actions/checkout@v4
+        with:
+          repository: ggerganov/llama.cpp
+          fetch-depth: 0
+          ref: '${{ github.event.inputs.llama_cpp_commit }}'
+      - name: Build
+        id: cmake_build_musl
+        run: |
+          mkdir build
+          cd build
+          cmake .. ${{ env.COMMON_DEFINE }} ${{ matrix.defines }}
+          cmake --build . --config Release -j ${env:NUMBER_OF_PROCESSORS}
+          ls -R
+      - uses: actions/upload-artifact@v4
+        with:
+          path: ./build/bin/libllama.so
+          name: llama-bin-musl-${{ matrix.build }}-x64.so
+          if-no-files-found: error
+      - uses: actions/upload-artifact@v4
+        with:
+          path: ./build/bin/libggml.so
+          name: ggml-bin-musl-${{ matrix.build }}-x64.so
+          if-no-files-found: error
+      - uses: actions/upload-artifact@v4
+        with:
+          path: ./build/bin/libggml-base.so
+          name: ggml-base-bin-musl-${{ matrix.build }}-x64.so
+          if-no-files-found: error
+      - uses: actions/upload-artifact@v4
+        with:
+          path: ./build/bin/libggml-cpu.so
+          name: ggml-cpu-bin-musl-${{ matrix.build }}-x64.so
+          if-no-files-found: error
+      - name: Upload Llava
+        uses: actions/upload-artifact@v4
+        with:
+          path: ./build/bin/libllava_shared.so
+          name: llava-bin-musl-${{ matrix.build }}-x64.so
+          if-no-files-found: error
+
   compile-windows:
     name: Compile (Windows)
     strategy:
@@ -528,6 +594,7 @@ jobs:
     if: ${{ always() }}
     needs: [
       "compile-linux",
+      "compile-musl",
       "compile-windows",
       "compile-vulkan",
       "compile-cublas",
@@ -543,7 +610,7 @@ jobs:
       - name: Rearrange Files
        run: |
          # Make all directories at once
-         mkdir --parents deps/{noavx,avx,avx2,avx512,osx-arm64,osx-x64,osx-x64-rosetta2,cu11.7.1,cu12.2.0,vulkan,android-arm64-v8a,android-x86,android-x86_64}
+         mkdir --parents deps/{noavx,avx,avx2,avx512,musl-noavx,musl-avx,musl-avx2,musl-avx512,osx-arm64,osx-x64,osx-x64-rosetta2,cu11.7.1,cu12.2.0,vulkan,android-arm64-v8a,android-x86,android-x86_64}
 
          # Linux
          cp artifacts/ggml-bin-linux-noavx-x64.so/libggml.so deps/noavx/libggml.so
@@ -570,6 +637,31 @@ jobs:
          cp artifacts/llama-bin-linux-avx512-x64.so/libllama.so deps/avx512/libllama.so
          cp artifacts/llava-bin-linux-avx512-x64.so/libllava_shared.so deps/avx512/libllava_shared.so
 
+         # Musl
+         cp artifacts/ggml-bin-musl-noavx-x64.so/libggml.so deps/musl-noavx/libggml.so
+         cp artifacts/ggml-base-bin-musl-noavx-x64.so/libggml-base.so deps/musl-noavx/libggml-base.so
+         cp artifacts/ggml-cpu-bin-musl-noavx-x64.so/libggml-cpu.so deps/musl-noavx/libggml-cpu.so
+         cp artifacts/llama-bin-musl-noavx-x64.so/libllama.so deps/musl-noavx/libllama.so
+         cp artifacts/llava-bin-musl-noavx-x64.so/libllava_shared.so deps/musl-noavx/libllava_shared.so
+
+         cp artifacts/ggml-bin-musl-avx-x64.so/libggml.so deps/musl-avx/libggml.so
+         cp artifacts/ggml-base-bin-musl-avx-x64.so/libggml-base.so deps/musl-avx/libggml-base.so
+         cp artifacts/ggml-cpu-bin-musl-avx-x64.so/libggml-cpu.so deps/musl-avx/libggml-cpu.so
+         cp artifacts/llama-bin-musl-avx-x64.so/libllama.so deps/musl-avx/libllama.so
+         cp artifacts/llava-bin-musl-avx-x64.so/libllava_shared.so deps/musl-avx/libllava_shared.so
+
+         cp artifacts/ggml-bin-musl-avx2-x64.so/libggml.so deps/musl-avx2/libggml.so
+         cp artifacts/ggml-base-bin-musl-avx2-x64.so/libggml-base.so deps/musl-avx2/libggml-base.so
+         cp artifacts/ggml-cpu-bin-musl-avx2-x64.so/libggml-cpu.so deps/musl-avx2/libggml-cpu.so
+         cp artifacts/llama-bin-musl-avx2-x64.so/libllama.so deps/musl-avx2/libllama.so
+         cp artifacts/llava-bin-musl-avx2-x64.so/libllava_shared.so deps/musl-avx2/libllava_shared.so
+
+         cp artifacts/ggml-bin-musl-avx512-x64.so/libggml.so deps/musl-avx512/libggml.so
+         cp artifacts/ggml-base-bin-musl-avx512-x64.so/libggml-base.so deps/musl-avx512/libggml-base.so
+         cp artifacts/ggml-cpu-bin-musl-avx512-x64.so/libggml-cpu.so deps/musl-avx512/libggml-cpu.so
+         cp artifacts/llama-bin-musl-avx512-x64.so/libllama.so deps/musl-avx512/libllama.so
+         cp artifacts/llava-bin-musl-avx512-x64.so/libllava_shared.so deps/musl-avx512/libllava_shared.so
+
          # Windows
          cp artifacts/ggml-bin-win-noavx-x64.dll/ggml.dll deps/noavx/ggml.dll
          cp artifacts/ggml-base-bin-win-noavx-x64.dll/ggml-base.dll deps/noavx/ggml-base.dll
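The musl job publishes the same five shared libraries as the glibc builds, and the rearrange step files them under deps/musl-{noavx,avx,avx2,avx512}. As a rough illustration of how a .NET application on an Alpine (musl) host could pin one of these binaries explicitly, here is a minimal C# sketch using the standard System.Runtime.InteropServices.NativeLibrary API; the relative path and the choice of the avx2 variant are assumptions for the example, not LLamaSharp's actual library-probing logic:

    using System;
    using System.IO;
    using System.Runtime.InteropServices;

    class MuslLoadSketch
    {
        static void Main()
        {
            // Hypothetical layout: the deps/musl-avx2 files shipped next to the app.
            // libllama's libggml* companions must also be resolvable by the dynamic
            // loader (same directory via rpath, or LD_LIBRARY_PATH).
            var libPath = Path.Combine(AppContext.BaseDirectory, "musl-avx2", "libllama.so");
            var handle = NativeLibrary.Load(libPath); // throws if resolution fails
            Console.WriteLine($"Loaded {libPath}");
            NativeLibrary.Free(handle);
        }
    }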

LLama.Examples/LLama.Examples.csproj

Lines changed: 4 additions & 4 deletions
@@ -14,16 +14,16 @@
   </PropertyGroup>
 
   <ItemGroup>
-    <PackageReference Include="Microsoft.Extensions.Logging.Console" Version="9.0.1" />
+    <PackageReference Include="Microsoft.Extensions.Logging.Console" Version="9.0.3" />
     <PackageReference Include="Microsoft.KernelMemory.Core" Version="0.97.250211.1" />
-    <PackageReference Include="Microsoft.SemanticKernel" Version="1.29.0" />
+    <PackageReference Include="Microsoft.SemanticKernel" Version="1.44.0" />
     <PackageReference Include="Microsoft.SemanticKernel.Plugins.Memory" Version="1.6.2-alpha" />
     <PackageReference Include="NAudio" Version="2.2.1" />
-    <PackageReference Include="SixLabors.ImageSharp" Version="3.1.5" />
+    <PackageReference Include="SixLabors.ImageSharp" Version="3.1.7" />
     <PackageReference Include="Spectre.Console" Version="0.49.1" />
     <PackageReference Include="Spectre.Console.ImageSharp" Version="0.49.1" />
     <PackageReference Include="Whisper.net" Version="1.7.4" />
-    <PackageReference Include="Whisper.net.Runtime" Version="1.7.2" />
+    <PackageReference Include="Whisper.net.Runtime" Version="1.7.4" />
     <PackageReference Include="Whisper.net.Runtime.Clblast" Version="1.5.0" />
     <PackageReference Include="Whisper.net.Runtime.CoreML" Version="1.7.4" />
     <PackageReference Include="Whisper.net.Runtime.Cublas" Version="1.5.0" />

LLama.KernelMemory/LLamaSharp.KernelMemory.csproj

Lines changed: 2 additions & 2 deletions
@@ -4,7 +4,7 @@
     <TargetFrameworks>net8.0</TargetFrameworks>
     <ImplicitUsings>enable</ImplicitUsings>
     <Nullable>enable</Nullable>
-    <Version>0.21.0</Version>
+    <Version>0.22.0</Version>
     <Authors>Xbotter</Authors>
     <Company>SciSharp STACK</Company>
     <GeneratePackageOnBuild>true</GeneratePackageOnBuild>
@@ -27,7 +27,7 @@
   </PropertyGroup>
 
   <ItemGroup>
-    <PackageReference Include="Microsoft.KernelMemory.Abstractions" Version="0.96.250120.1" />
+    <PackageReference Include="Microsoft.KernelMemory.Abstractions" Version="0.98.250323.1" />
   </ItemGroup>
 
   <ItemGroup>

LLama.KernelMemory/LLamaSharpTextEmbeddingGenerator.cs

Lines changed: 2 additions & 1 deletion
@@ -33,9 +33,10 @@ public LLamaSharpTextEmbeddingGenerator(LLamaSharpConfig config)
         {
             ContextSize = config.ContextSize,
             GpuLayerCount = config.GpuLayerCount ?? 20,
-            Embeddings = true,
+
             PoolingType = LLamaPoolingType.Mean,
         };
+
         _weights = LLamaWeights.LoadFromFile(@params);
         _embedder = new LLamaEmbedder(_weights, @params);
         _ownsWeights = true;

LLama.SemanticKernel/LLamaSharp.SemanticKernel.csproj

Lines changed: 3 additions & 3 deletions
@@ -10,7 +10,7 @@
     <ImplicitUsings>enable</ImplicitUsings>
     <Nullable>enable</Nullable>
 
-    <Version>0.21.0</Version>
+    <Version>0.22.0</Version>
     <Authors>Tim Miller, Xbotter</Authors>
     <Company>SciSharp STACK</Company>
     <GeneratePackageOnBuild>true</GeneratePackageOnBuild>
@@ -34,11 +34,11 @@
   </PropertyGroup>
 
   <ItemGroup>
-    <PackageReference Include="Microsoft.SemanticKernel.Abstractions" Version="1.39.0" />
+    <PackageReference Include="Microsoft.SemanticKernel.Abstractions" Version="1.44.0" />
   </ItemGroup>
 
   <ItemGroup Condition="'$(TargetFramework)' == 'netstandard2.0'">
-    <PackageReference Include="System.Memory" Version="4.6.0" PrivateAssets="all" />
+    <PackageReference Include="System.Memory" Version="4.6.2" PrivateAssets="all" />
   </ItemGroup>
 
   <ItemGroup>

LLama.Unittest/KernelMemory/ITextTokenizerTests.cs

Lines changed: 1 addition & 1 deletion
@@ -22,7 +22,7 @@ public ITextTokenizerTests(ITestOutputHelper testOutputHelper)
         _testOutputHelper = testOutputHelper;
 
         _infParams = new() { AntiPrompts = ["\n\n"] };
-        _lsConfig = new(Constants.GenerativeModelPath) { DefaultInferenceParams = _infParams };
+        _lsConfig = new(Constants.GenerativeModelPath) { DefaultInferenceParams = _infParams, ContextSize = 512 };
 
         testOutputHelper.WriteLine($"Using model {Path.GetFileName(_lsConfig.ModelPath)}");
     }

LLama.Unittest/LLama.Unittest.csproj

Lines changed: 3 additions & 3 deletions
@@ -13,11 +13,11 @@
   </PropertyGroup>
 
   <ItemGroup>
-    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.12.0" />
+    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.13.0" />
     <PackageReference Include="Moq" Version="4.20.72" />
     <PackageReference Include="System.Linq.Async" Version="6.0.1" />
-    <PackageReference Include="xunit" Version="2.9.2" />
-    <PackageReference Include="xunit.runner.visualstudio" Version="3.0.0">
+    <PackageReference Include="xunit" Version="2.9.3" />
+    <PackageReference Include="xunit.runner.visualstudio" Version="3.0.2">
       <IncludeAssets>runtime; build; native; contentfiles; analyzers; buildtransitive</IncludeAssets>
       <PrivateAssets>all</PrivateAssets>
     </PackageReference>

LLama.Unittest/LLamaContextTests.cs

Lines changed: 14 additions & 0 deletions
@@ -14,6 +14,10 @@ public LLamaContextTests()
         var @params = new ModelParams(Constants.GenerativeModelPath2)
         {
             ContextSize = 128,
+            BatchSize = 8,
+            UBatchSize = 8,
+            SeqMax = 1,
+            VocabOnly = false,
             GpuLayerCount = Constants.CIGpuLayerCount,
         };
         _weights = LLamaWeights.LoadFromFile(@params);
@@ -84,6 +88,11 @@ public void TokenizeEmpty()
     [Fact]
     public void SaveLoadState()
     {
+        // Make sure there's something in the context worth saving
+        var batch = new LLamaBatch();
+        batch.Add(17, 0, LLamaSeqId.Zero, true);
+        _context.Decode(batch);
+
         using var state1 = _context.GetState();
 
         var stream = new MemoryStream();
@@ -99,6 +108,11 @@ public void SaveLoadState()
     [Fact]
     public async Task SaveLoadStateAsync()
     {
+        // Make sure there's something in the context worth saving
+        var batch = new LLamaBatch();
+        batch.Add(17, 0, LLamaSeqId.Zero, true);
+        _context.Decode(batch);
+
         using var state1 = _context.GetState();
 
         var stream = new MemoryStream();
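The decode added before each snapshot reflects that a freshly created context has an empty KV cache, so there was previously nothing meaningful to save. The same checkpoint pattern, sketched outside the test harness using only calls that appear in this diff (token 17 and sequence zero are arbitrary placeholders; persisting the state object is elided, as it is in the truncated test bodies):

    using System.IO;
    using LLama;
    using LLama.Native;

    static class ContextCheckpoint
    {
        public static void Checkpoint(LLamaContext context, Stream destination)
        {
            // Run at least one token through the context so the KV cache is non-empty.
            var batch = new LLamaBatch();
            batch.Add(17, 0, LLamaSeqId.Zero, true);
            context.Decode(batch);

            // Snapshot the context state; the tests copy it into a MemoryStream.
            using var state = context.GetState();
            // ... write `state` out to `destination` ...
        }
    }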

LLama.Unittest/LLamaEmbedderTests.cs

Lines changed: 2 additions & 2 deletions
@@ -45,8 +45,8 @@ private async Task CompareEmbeddings(string modelPath)
         var generator = (IEmbeddingGenerator<string, Embedding<float>>)embedder;
         Assert.NotNull(generator.GetService<EmbeddingGeneratorMetadata>());
         Assert.Equal(nameof(LLamaEmbedder), generator.GetService<EmbeddingGeneratorMetadata>()?.ProviderName);
-        Assert.NotNull(generator.GetService<EmbeddingGeneratorMetadata>()?.ModelId);
-        Assert.NotEmpty(generator.GetService<EmbeddingGeneratorMetadata>()?.ModelId!);
+        Assert.NotNull(generator.GetService<EmbeddingGeneratorMetadata>()?.DefaultModelId);
+        Assert.NotEmpty(generator.GetService<EmbeddingGeneratorMetadata>()?.DefaultModelId!);
         Assert.Same(embedder, generator.GetService<LLamaEmbedder>());
         Assert.Same(generator, generator.GetService<IEmbeddingGenerator<string, Embedding<float>>>());
         Assert.Null(generator.GetService<string>());
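This tracks the upstream Microsoft.Extensions.AI rename of the metadata property from ModelId to DefaultModelId; the provider-name and service-resolution assertions are unchanged.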

LLama.Web/Common/InferenceOptions.cs

Lines changed: 1 addition & 1 deletion
@@ -20,6 +20,6 @@ public class InferenceOptions
         public IReadOnlyList<string> AntiPrompts { get; set; } = Array.Empty<string>();
 
         /// <inheritdoc />
-        public required ISamplingPipeline SamplingPipeline { get; set; }
+        public ISamplingPipeline SamplingPipeline { get; set; } = new DefaultSamplingPipeline();
     }
 }
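With the required modifier removed and DefaultSamplingPipeline supplied as the initial value, InferenceOptions can now be constructed without an object initializer. A small before/after sketch from a caller's point of view (namespaces inferred from the file paths in this commit):

    using LLama.Sampling;
    using LLama.Web.Common;

    // Before: `required` forced every construction site to supply a pipeline.
    //   var opts = new InferenceOptions { SamplingPipeline = new DefaultSamplingPipeline() };

    // After: the bare constructor is enough, and overriding is still possible.
    var opts = new InferenceOptions();
    var custom = new InferenceOptions { SamplingPipeline = new DefaultSamplingPipeline() };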
