fix: sampler vocab size — construct the sampler with the tokenizer's vocab size instead of the model header's. (#241)

b4rtaz · web-flow · commit a70dd6fb4bb0 · 2025-08-10T00:32:54.000+02:00
diff --git a/src/app.cpp b/src/app.cpp
@@ -234,9 +234,9 @@ void runInferenceApp(AppCliArgs *args, void (*handler)(AppInferenceContext *cont
 
     Tokenizer tokenizer(args->tokenizerPath);
     if (tokenizer.vocabSize != header.vocabSize)
-        printf("Tokenizer vocab size does not match the model vocab size: %d != %d\n", tokenizer.vocabSize, header.vocabSize);
+        printf("Tokenizer vocab size (%d) does not match the model vocab size (%d)\n", tokenizer.vocabSize, header.vocabSize);
 
-    Sampler sampler(header.vocabSize, args->temperature, args->topp, args->seed);
+    Sampler sampler(tokenizer.vocabSize, args->temperature, args->topp, args->seed);
 
     LlmNet net = buildLlmNet(&header, nNodes, args->nBatches);
     std::unique_ptr<LlmNet, void(*)(LlmNet *)> netPtr(&net, releaseLlmNet);
diff --git a/src/nn/nn-vulkan-test.cpp b/src/nn/nn-vulkan-test.cpp
@@ -421,7 +421,6 @@ void testCast_F32_Q80() {
             for (NnUint i = 0; i < N_BATCHES * dim; i++) {
                 const float expectedV = (float)(i + 1);
                 const float change = (yF32[i] - expectedV) / expectedV;
-                printf("cast %f %f\n", expectedV, yF32[i]);
                 assertFloat(i, change, 0.0, 0.009f);
             }
             printOk("testCast_F32_Q80");

Original file line number	Diff line number	Diff line change
`@@ -421,7 +421,6 @@ void testCast_F32_Q80() {`
`421`	`421`	`for (NnUint i = 0; i < N_BATCHES * dim; i++) {`
`422`	`422`	`const float expectedV = (float)(i + 1);`
`423`	`423`	`const float change = (yF32[i] - expectedV) / expectedV;`
`424`		`- printf("cast %f %f\n", expectedV, yF32[i]);`
`425`	`424`	`assertFloat(i, change, 0.0, 0.009f);`
`426`	`425`	`}`
`427`	`426`	`printOk("testCast_F32_Q80");`