Skip to content

Commit d7c8669

Browse files
authored
fix: temporarily pin to a working llama.cpp release
1 parent 1c03fef commit d7c8669

File tree

2 files changed

+8
-3
lines changed

2 files changed

+8
-3
lines changed

.github/workflows/build.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -23,8 +23,8 @@ jobs:
2323
- name: Download latest llama.cpp release
2424
env:
2525
CI: true
26-
# pinned to `b4357` temporarily until the Windows on Arm64 build is fixed
27-
run: node ./dist/cli/cli.js source download --release b4357 --skipBuild --noBundle --noUsageExample --updateBinariesReleaseMetadataAndSaveGitBundle
26+
# pinned to `b4333` temporarily until the Windows on Arm64 build is fixed
27+
run: node ./dist/cli/cli.js source download --release b4333 --skipBuild --noBundle --noUsageExample --updateBinariesReleaseMetadataAndSaveGitBundle
2828
- name: Upload build artifact
2929
uses: actions/upload-artifact@v4
3030
with:

llama/addon/AddonSampler.cpp

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -350,10 +350,15 @@ Napi::Value AddonSampler::ApplyConfig(const Napi::CallbackInfo& info) {
350350

351351
if (shouldCreateSampler) {
352352
repeatPenaltySampler = llama_sampler_init_penalties(
353+
llama_n_vocab(model->model),
354+
llama_token_eos(model->model),
355+
llama_token_nl(model->model),
353356
repeatPenaltyMaxTokens,
354357
repeatPenalty,
355358
repeatPenaltyFrequencyPenalty,
356-
repeatPenaltyPresencePenalty
359+
repeatPenaltyPresencePenalty,
360+
true,
361+
false
357362
);
358363
repeatPenalty_lastTokens = RingBuffer<llama_token>(repeatPenaltyMaxTokens);
359364

0 commit comments

Comments
 (0)