|
1 | 1 | //! A safe wrapper around `llama_model_params`. |
2 | 2 |
|
3 | | -use std::fmt::Debug; |
| 3 | +use crate::model::params::kv_overrides::KvOverrides; |
| 4 | +use std::ffi::{c_char, CStr}; |
| 5 | +use std::fmt::{Debug, Formatter}; |
| 6 | +use std::pin::Pin; |
| 7 | +use std::ptr::null; |
| 8 | + |
| 9 | +pub mod kv_overrides; |
4 | 10 |
|
5 | 11 | /// A safe wrapper around `llama_model_params`. |
| 12 | +/// |
| 13 | +/// [`T`] is the type of the backing storage for the key-value overrides. Generally it can be left to [`()`] which will |
| 14 | +/// make your life with the borrow checker much easier. |
6 | 15 | #[allow(clippy::module_name_repetitions)] |
7 | | -#[derive(Debug)] |
8 | 16 | pub struct LlamaModelParams { |
9 | 17 | pub(crate) params: llama_cpp_sys_2::llama_model_params, |
| 18 | + kv_overrides: Vec<llama_cpp_sys_2::llama_model_kv_override>, |
| 19 | +} |
| 20 | + |
| 21 | +impl Debug for LlamaModelParams { |
| 22 | + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { |
| 23 | + f.debug_struct("LlamaModelParams") |
| 24 | + .field("n_gpu_layers", &self.params.n_gpu_layers) |
| 25 | + .field("main_gpu", &self.params.main_gpu) |
| 26 | + .field("vocab_only", &self.params.vocab_only) |
| 27 | + .field("use_mmap", &self.params.use_mmap) |
| 28 | + .field("use_mlock", &self.params.use_mlock) |
| 29 | + .field("kv_overrides", &"vec of kv_overrides") |
| 30 | + .finish() |
| 31 | + } |
| 32 | +} |
| 33 | + |
| 34 | +impl LlamaModelParams { |
| 35 | + /// See [`KvOverrides`] |
| 36 | + /// |
| 37 | + /// # Examples |
| 38 | + /// |
| 39 | + /// ```rust |
| 40 | + /// # use llama_cpp_2::model::params::LlamaModelParams; |
| 41 | + /// let params = Box::pin(LlamaModelParams::default()); |
| 42 | + /// let kv_overrides = params.kv_overrides(); |
| 43 | + /// let count = kv_overrides.into_iter().count(); |
| 44 | + /// assert_eq!(count, 0); |
| 45 | + /// ``` |
| 46 | + #[must_use] |
| 47 | + pub fn kv_overrides(&self) -> KvOverrides { |
| 48 | + KvOverrides::new(self) |
| 49 | + } |
| 50 | + |
| 51 | + /// Appends a key-value override to the model parameters. It must be pinned as this creates a self-referential struct. |
| 52 | + /// |
| 53 | + /// # Examples |
| 54 | + /// |
| 55 | + /// ```rust |
| 56 | + /// # use std::ffi::{CStr, CString}; |
| 57 | + /// use std::pin::pin; |
| 58 | + /// # use llama_cpp_2::model::params::LlamaModelParams; |
| 59 | + /// # use llama_cpp_2::model::params::kv_overrides::ParamOverrideValue; |
| 60 | + /// let mut params = pin!(LlamaModelParams::default()); |
| 61 | + /// let key = CString::new("key").expect("CString::new failed"); |
| 62 | + /// params.append_kv_override(&key, ParamOverrideValue::Int(50)); |
| 63 | + /// |
| 64 | + /// let kv_overrides = params.kv_overrides().into_iter().collect::<Vec<_>>(); |
| 65 | + /// assert_eq!(kv_overrides.len(), 1); |
| 66 | + /// |
| 67 | + /// let (k, v) = &kv_overrides[0]; |
| 68 | + /// assert_eq!(v, &ParamOverrideValue::Int(50)); |
| 69 | + /// |
| 70 | + /// assert_eq!(k.to_bytes(), b"key", "expected key to be 'key', was {:?}", k); |
| 71 | + /// ``` |
| 72 | + #[allow(clippy::missing_panics_doc)] // panics are just to enforce internal invariants, not user errors |
| 73 | + pub fn append_kv_override( |
| 74 | + self: &mut Pin<&mut Self>, |
| 75 | + key: &CStr, |
| 76 | + value: kv_overrides::ParamOverrideValue, |
| 77 | + ) { |
| 78 | + let kv_override = self |
| 79 | + .kv_overrides |
| 80 | + .get_mut(0) |
| 81 | + .expect("kv_overrides did not have a next allocated"); |
| 82 | + |
| 83 | + assert_eq!(kv_override.key[0], 0, "last kv_override was not empty"); |
| 84 | + |
| 85 | + // There should be some way to do this without iterating over everything. |
| 86 | + for (i, &c) in key.to_bytes_with_nul().iter().enumerate() { |
| 87 | + kv_override.key[i] = c_char::try_from(c).expect("invalid character in key"); |
| 88 | + } |
| 89 | + |
| 90 | + kv_override.tag = value.tag(); |
| 91 | + kv_override.__bindgen_anon_1 = value.value(); |
| 92 | + |
| 93 | + // set to null pointer for panic safety (as push may move the vector, invalidating the pointer) |
| 94 | + self.params.kv_overrides = null(); |
| 95 | + |
| 96 | + // push the next one to ensure we maintain the iterator invariant of ending with a 0 |
| 97 | + self.kv_overrides |
| 98 | + .push(llama_cpp_sys_2::llama_model_kv_override { |
| 99 | + key: [0; 128], |
| 100 | + tag: 0, |
| 101 | + __bindgen_anon_1: llama_cpp_sys_2::llama_model_kv_override__bindgen_ty_1 { |
| 102 | + int_value: 0, |
| 103 | + }, |
| 104 | + }); |
| 105 | + |
| 106 | + // set the pointer to the (potentially) new vector |
| 107 | + self.params.kv_overrides = self.kv_overrides.as_ptr(); |
| 108 | + |
| 109 | + eprintln!("saved ptr: {:?}", self.params.kv_overrides); |
| 110 | + } |
10 | 111 | } |
11 | 112 |
|
12 | 113 | impl LlamaModelParams { |
@@ -90,8 +191,16 @@ impl LlamaModelParams { |
90 | 191 | /// ``` |
91 | 192 | impl Default for LlamaModelParams { |
92 | 193 | fn default() -> Self { |
| 194 | + let default_params = unsafe { llama_cpp_sys_2::llama_model_default_params() }; |
93 | 195 | LlamaModelParams { |
94 | | - params: unsafe { llama_cpp_sys_2::llama_model_default_params() }, |
| 196 | + params: default_params, |
| 197 | + kv_overrides: vec![llama_cpp_sys_2::llama_model_kv_override { |
| 198 | + key: [0; 128], |
| 199 | + tag: 0, |
| 200 | + __bindgen_anon_1: llama_cpp_sys_2::llama_model_kv_override__bindgen_ty_1 { |
| 201 | + int_value: 0, |
| 202 | + }, |
| 203 | + }], |
95 | 204 | } |
96 | 205 | } |
97 | 206 | } |
0 commit comments