Merge pull request #689 from vlovich/expose-head-n-kv

MarcusDunn · web-flow · commit 209ad8666286 · 2025-03-03T09:48:56.000-08:00
Expose n_head_kv
diff --git a/llama-cpp-2/src/model.rs b/llama-cpp-2/src/model.rs
@@ -484,6 +484,13 @@ impl LlamaModel {
         u32::try_from(unsafe { llama_cpp_sys_2::llama_model_n_head(self.model.as_ptr()) }).unwrap()
     }
 
+    /// Returns the number of KV attention heads, as reported by `llama_model_n_head_kv`.
+    pub fn n_head_kv(&self) -> u32 {
+        // The C API returns an int32_t although the field it reads is a uint32_t, so the `unwrap` is
+        // not expected to fire. NOTE(review): a value above `i32::MAX` would still arrive negative.
+        u32::try_from(unsafe { llama_cpp_sys_2::llama_model_n_head_kv(self.model.as_ptr()) }).unwrap()
+    }
+
     /// Returns the rope type of the model.
     pub fn rope_type(&self) -> Option<RopeType> {
         match unsafe { llama_cpp_sys_2::llama_model_rope_type(self.model.as_ptr()) } {
diff --git a/llama-cpp-sys-2/llama.cpp b/llama-cpp-sys-2/llama.cpp
@@ -1 +1 @@
-Subproject commit 300907b2110cc17b4337334dc397e05de2d8f5e0
+Subproject commit 06c2b1561d8b882bc018554591f8c35eb04ad30e