Commit 2c41dff

llama : fix llama_decode return code when could not find KV slot
ggml-ci
1 parent eb5518f

3 files changed: +5 −1 lines changed

examples/parallel/parallel.cpp (2 additions, 0 deletions)

@@ -106,6 +106,8 @@ int main(int argc, char ** argv) {
 
     common_params params;
 
+    params.n_predict = 128;
+
     if (!common_params_parse(argc, argv, params, LLAMA_EXAMPLE_PARALLEL)) {
         return 1;
     }
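
A note on the ordering in this hunk: common_params initializes n_predict to -1 (predict without limit), and defaults assigned to the struct are kept only when the user passes no overriding flag, because parsing happens afterwards. A small annotated sketch of that pattern (the comments are mine, assuming the usual common_params defaults):

    common_params params;   // n_predict starts at -1, i.e. predict indefinitely

    params.n_predict = 128; // example-specific default, applied before parsing

    // flags parsed afterwards still win, so `-n 256` on the command line
    // overrides the 128 set above
    if (!common_params_parse(argc, argv, params, LLAMA_EXAMPLE_PARALLEL)) {
        return 1;
    }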

src/llama-context.cpp (1 addition, 1 deletion)

@@ -1298,7 +1298,7 @@ int llama_context::decode(llama_batch & inp_batch) {
     {
         if (!kv_self->find_slot(ubatch)) {
             LLAMA_LOG_ERROR("%s: failed to prepare ubatch\n", __func__);
-            return -3;
+            return 1;
         }
 
         if (!kv_self->recurrent) {
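
This change lines up with the return-code convention documented in llama.h: 0 means success, a positive value is a recoverable warning (1 = could not find a KV slot for the batch), and negative values are fatal errors. Returning -3 made callers treat a full KV cache as fatal. A minimal caller-side sketch of how the distinction can be used (decode_with_retry is a hypothetical helper, not part of the library):

    #include <cstdio>
    #include <cstdlib>

    #include "llama.h"

    // Hypothetical helper illustrating the llama.h return-code convention.
    static bool decode_with_retry(llama_context * ctx, llama_batch batch) {
        const int ret = llama_decode(ctx, batch);

        if (ret == 0) {
            return true; // batch decoded successfully
        }

        if (ret > 0) {
            // warning, not fatal: 1 means no free KV slot for this batch;
            // the caller can shrink the batch or free sequences and retry
            fprintf(stderr, "llama_decode: no KV slot, retrying with a smaller batch\n");
            return false;
        }

        // negative: fatal error, do not keep feeding this context
        fprintf(stderr, "llama_decode: fatal error %d\n", ret);
        abort();
    }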

src/llama-kv-cache.cpp (2 additions, 0 deletions)

@@ -204,6 +204,8 @@ bool llama_kv_cache_unified::seq_rm(llama_seq_id seq_id, llama_pos p0, llama_pos p1) {
                 return false;
             }
         }
+
+        return true;
     }
 
     for (uint32_t i = 0; i < size; ++i) {
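
Reading the hunk, the added return closes an early-exit gap: without it, the recurrent-cache branch of seq_rm fell through into the cell-scanning loop below, which is meant for the non-recurrent layout. A simplified control-flow sketch of the fixed shape (hypothetical names, not the actual implementation):

    #include <cstdint>

    // Simplified shape of llama_kv_cache_unified::seq_rm (hypothetical sketch).
    bool seq_rm_sketch(bool recurrent, uint32_t size) {
        if (recurrent) {
            // ... recurrent-specific removal; returns false on invalid ranges ...

            return true; // the added line: stop here instead of falling through
        }

        // non-recurrent path only: scan every cell and clear matches
        for (uint32_t i = 0; i < size; ++i) {
            // ... clear cells belonging to the sequence ...
        }

        return true;
    }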
