
Commit 704a0a8 (parent: 403ba7a)

refactor: rename *_is_hybrid -> *_is_hybrid_recurrent

The implementation of the hybrid cache intentionally does not specify the
types of the child caches, so there was a naming mismatch with these
predicate functions that used "hybrid" to imply "hybrid recurrent."

Branch: HybridCache
Signed-off-by: Gabe Goodhart <ghart@us.ibm.com>

4 files changed: 6 additions, 6 deletions

include/llama.h (1 addition, 1 deletion)

@@ -554,7 +554,7 @@ extern "C" {
     LLAMA_API bool llama_model_is_recurrent(const struct llama_model * model);
 
     // Returns true if the model is hybrid-recurrent (like Jamba, Bamba, etc.)
-    LLAMA_API bool llama_model_is_hybrid(const struct llama_model * model);
+    LLAMA_API bool llama_model_is_hybrid_recurrent(const struct llama_model * model);
 
     // Returns 0 on success
     LLAMA_API uint32_t llama_model_quantize(
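For context, here is a caller-side sketch of how the renamed public predicate
might be used alongside the existing llama_model_is_recurrent check. This
example is not part of the commit; the report_memory_kind helper is
hypothetical, and only the two predicates shown in this diff are taken from
the API.

#include "llama.h"
#include <stdio.h>

// Hypothetical helper: report which kind of memory/cache a model needs.
static void report_memory_kind(const struct llama_model * model) {
    if (llama_model_is_hybrid_recurrent(model)) {
        // mixed attention + recurrent layers (e.g. Jamba, Bamba)
        printf("hybrid-recurrent: needs both a KV cache and recurrent state\n");
    } else if (llama_model_is_recurrent(model)) {
        // purely recurrent (e.g. Mamba)
        printf("recurrent: needs recurrent state only\n");
    } else {
        printf("standard: needs a unified KV cache only\n");
    }
}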

src/llama-arch.cpp (1 addition, 1 deletion)

@@ -1759,7 +1759,7 @@ bool llm_arch_is_recurrent(const llm_arch & arch) {
     }
 }
 
-bool llm_arch_is_hybrid(const llm_arch & arch) {
+bool llm_arch_is_hybrid_recurrent(const llm_arch & arch) {
     // TODO: There are currently no hybrid models! Once there are, this will be
     // the place to identify them
     switch (arch) {
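The hunk cuts off at the switch. Given the TODO and the shape of
llm_arch_is_recurrent just above it, the full function plausibly reads as
below; the default case is an assumption, not shown in the diff.

bool llm_arch_is_hybrid_recurrent(const llm_arch & arch) {
    // TODO: There are currently no hybrid models! Once there are, this will be
    // the place to identify them
    switch (arch) {
        default:
            // assumed: no architecture qualifies yet, so everything falls
            // through to false
            return false;
    }
}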

src/llama-arch.h (1 addition, 1 deletion)

@@ -438,4 +438,4 @@ llm_arch llm_arch_from_string(const std::string & name);
 const llm_tensor_info & llm_tensor_info_for(llm_tensor tensor);
 
 bool llm_arch_is_recurrent(const llm_arch& arch);
-bool llm_arch_is_hybrid(const llm_arch& arch);
+bool llm_arch_is_hybrid_recurrent(const llm_arch& arch);

src/llama-model.cpp (3 additions, 3 deletions)

@@ -13208,7 +13208,7 @@ llama_memory_i * llama_model::create_memory(const llama_memory_params & params,
             // checks
         default:
             {
-                if (llm_arch_is_hybrid(arch)) {
+                if (llm_arch_is_hybrid_recurrent(arch)) {
                     // make vectors of recurrent and non-recurrent layer indices
                     std::vector<size_t> recurrent_layers;
                     std::vector<size_t> unified_layers;

@@ -13848,8 +13848,8 @@ bool llama_model_is_recurrent(const llama_model * model) {
     return llm_arch_is_recurrent(model->arch);
 }
 
-bool llama_model_is_hybrid(const llama_model * model) {
-    return llm_arch_is_hybrid(model->arch);
+bool llama_model_is_hybrid_recurrent(const llama_model * model) {
+    return llm_arch_is_hybrid_recurrent(model->arch);
 }
 
 const std::vector<std::pair<std::string, ggml_tensor *>> & llama_internal_get_tensor_map(const llama_model * model) {
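The first hunk in this file stops right after the two index vectors are
declared. A sketch of how that branch might continue, splitting layers
between the two child caches; the hparams.recurrent_layer(il) helper and
everything after the vector declarations are assumptions for illustration,
not part of this diff.

// Hypothetical continuation of the hybrid-recurrent branch in create_memory.
std::vector<size_t> recurrent_layers;
std::vector<size_t> unified_layers;
for (size_t il = 0; il < hparams.n_layer; ++il) {
    if (hparams.recurrent_layer(il)) {  // assumed per-layer predicate
        recurrent_layers.push_back(il); // served by the recurrent child cache
    } else {
        unified_layers.push_back(il);   // served by the unified KV child cache
    }
}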
