2 files changed: +7 -0 lines changed
Original file line number | Diff line number | Diff line change
@@ -3883,6 +3883,11 @@ llama_context_recurrent::llama_context_recurrent(
3883
3883
// Out-of-line destructor for llama_context_recurrent, explicitly defaulted.
llama_context_recurrent::~llama_context_recurrent () = default ;
3884
3884
3885
3885
void llama_context_recurrent::reserve () {
3886
+ // simulate full KV cache
3887
+ kv_self.n = kv_self.size ;
3888
+
3889
+ LLAMA_LOG_DEBUG (" %s: kv_self.n = %u\n " , __func__, kv_self.n );
3890
+
3886
3891
// TODO: implement recurrent-specific reserve logic
3887
3892
llama_context::reserve ();
3888
3893
}
Original file line number Diff line number Diff line change @@ -447,6 +447,7 @@ class llama_context_kv_self : public llama_context {
447
447
ggml_tensor * self_k_shift; // I32 [kv_size]
448
448
} inp;
449
449
450
+ protected:
450
451
//
451
452
// graph
452
453
//
@@ -570,6 +571,7 @@ class llama_context_recurrent : public llama_context {
570
571
ggml_tensor * s_mask; // F32 [1, n_kv]
571
572
} inp;
572
573
574
+ protected:
573
575
//
574
576
// graph
575
577
//
You can’t perform that action at this time.
0 commit comments