Reduce log level of the prompt-cache mismatch debug output, which leaked prompt contents at warning level

l-austenfeld · l-austenfeld · commit 7e3b260f4f03 · 2025-10-22T22:00:45.000+02:00
diff --git a/tools/server/server.cpp b/tools/server/server.cpp
@@ -3818,7 +3818,7 @@ struct server_context {
 
                                 // when the prompt prefix does not match, print the tokens around the mismatch
                                 // this is useful for debugging prompt caching
-                                {
+                                if (GGML_LOG_LEVEL_DEBUG <= common_log_verbosity_thold) {
                                     const int np0 = std::max<int>(slot.n_past - 4, 0);
                                     const int np1 = std::min<int>(slot.n_past + 6, std::min(slot.prompt.tokens.size(), slot.task->tokens.size()));
 
@@ -3852,11 +3852,11 @@ struct server_context {
                                         }
                                     }
 
-                                    SLT_WRN(slot, "%s\n", ss0.str().c_str());
-                                    SLT_WRN(slot, "%s\n", ss1.str().c_str());
+                                    SLT_DBG(slot, "%s\n", ss0.str().c_str());
+                                    SLT_DBG(slot, "%s\n", ss1.str().c_str());
 
-                                    SLT_WRN(slot, "%s\n", st0.str().c_str());
-                                    SLT_WRN(slot, "%s\n", st1.str().c_str());
+                                    SLT_DBG(slot, "%s\n", st0.str().c_str());
+                                    SLT_DBG(slot, "%s\n", st1.str().c_str());
                                 }
 
                                 if (pos_min > pos_min_thold) {

Original file line number	Diff line number	Diff line change
`@@ -3818,7 +3818,7 @@ struct server_context {`
`3818`	`3818`
`3819`	`3819`	`// when the prompt prefix does not match, print the tokens around the mismatch`
`3820`	`3820`	`// this is useful for debugging prompt caching`
`3821`		`- {`
	`3821`	`+ if (GGML_LOG_LEVEL_DEBUG <= common_log_verbosity_thold) {`
`3822`	`3822`	`const int np0 = std::max<int>(slot.n_past - 4, 0);`
`3823`	`3823`	`const int np1 = std::min<int>(slot.n_past + 6, std::min(slot.prompt.tokens.size(), slot.task->tokens.size()));`
`3824`	`3824`
`@@ -3852,11 +3852,11 @@ struct server_context {`
`3852`	`3852`	`}`
`3853`	`3853`	`}`
`3854`	`3854`
`3855`		`- SLT_WRN(slot, "%s\n", ss0.str().c_str());`
`3856`		`- SLT_WRN(slot, "%s\n", ss1.str().c_str());`
	`3855`	`+ SLT_DBG(slot, "%s\n", ss0.str().c_str());`
	`3856`	`+ SLT_DBG(slot, "%s\n", ss1.str().c_str());`
`3857`	`3857`
`3858`		`- SLT_WRN(slot, "%s\n", st0.str().c_str());`
`3859`		`- SLT_WRN(slot, "%s\n", st1.str().c_str());`
	`3858`	`+ SLT_DBG(slot, "%s\n", st0.str().c_str());`
	`3859`	`+ SLT_DBG(slot, "%s\n", st1.str().c_str());`
`3860`	`3860`	`}`
`3861`	`3861`
`3862`	`3862`	`if (pos_min > pos_min_thold) {`