@@ -311,9 +311,9 @@ static buft_list_t make_gpu_buft_list(ggml_backend_dev_t dev, enum llama_split_m
311311 ggml_backend_reg_get_proc_address (reg, " ggml_backend_split_buffer_type" );
312312 if (ggml_backend_split_buffer_type_fn) {
313313 size_t dev_index = [&]() {
314- auto * reg = ggml_backend_dev_backend_reg (dev);
315- for (size_t i = 0 ; i < ggml_backend_reg_dev_count (reg ); ++i) {
316- if (ggml_backend_reg_dev_get (reg , i) == dev) {
314+ ggml_backend_reg_t reg_dev = ggml_backend_dev_backend_reg (dev);
315+ for (size_t i = 0 ; i < ggml_backend_reg_dev_count (reg_dev ); ++i) {
316+ if (ggml_backend_reg_dev_get (reg_dev , i) == dev) {
317317 return i;
318318 }
319319 }
@@ -1304,7 +1304,7 @@ bool llama_model::load_tensors(llama_model_loader & ml) {
13041304 const int act_gpu_layers = devices.empty () ? 0 : std::min (n_gpu_layers, (int )n_layer + 1 );
13051305 auto get_layer_buft_list = [&](int il) -> llama_model::impl::layer_dev {
13061306 if (il < i_gpu_start || (il - i_gpu_start) >= act_gpu_layers) {
1307- return {cpu_dev, &pimpl->cpu_buft_list };
1307+ return { cpu_dev, &pimpl->cpu_buft_list };
13081308 }
13091309 const int layer_gpu = std::upper_bound (splits.begin (), splits.begin () + n_devices (), float (il - i_gpu_start)/act_gpu_layers) - splits.begin ();
13101310 auto * dev = devices.at (layer_gpu);
@@ -1453,7 +1453,6 @@ bool llama_model::load_tensors(llama_model_loader & ml) {
14531453 // avoid using a host buffer when using mmap
14541454 auto * buft_dev = ggml_backend_buft_get_device (buft);
14551455 if (ml.use_mmap && buft_dev && buft == ggml_backend_dev_host_buffer_type (buft_dev)) {
1456- auto * cpu_dev = ggml_backend_dev_by_type (GGML_BACKEND_DEVICE_TYPE_CPU);
14571456 buft = ggml_backend_dev_buffer_type (cpu_dev);
14581457 }
14591458
@@ -3697,8 +3696,8 @@ ggml_backend_buffer_type_t llama_model::select_buft(int il) const {
36973696
36983697const struct ggml_tensor * llama_model::get_tensor (const char * name) const {
36993698 auto it = std::find_if (tensors_by_name.begin (), tensors_by_name.end (),
3700- [name](const std::pair<std::string, struct ggml_tensor *> & it ) {
3701- return it .first == name;
3699+ [name](const std::pair<std::string, struct ggml_tensor *> & entry ) {
3700+ return entry .first == name;
37023701 });
37033702 if (it == tensors_by_name.end ()) {
37043703 return nullptr ;
0 commit comments