Skip to content

Commit febdec3

Browse files
committed
fix code and instructions
1 parent 2275a66 commit febdec3

File tree

2 files changed

+6
-16
lines changed

2 files changed

+6
-16
lines changed

.github/copilot-instructions.md

Lines changed: 2 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -25,27 +25,17 @@ This is a fork of llama.cpp with **NUMA-aware improvements** for better CPU thre
2525

2626
```bash
2727
# Manual build steps
28-
cmake -B build -DCMAKE_BUILD_TYPE=Release -DCMAKE_EXPORT_COMPILE_COMMANDS=ON
28+
cmake -B build -DCMAKE_BUILD_TYPE=Release -DCMAKE_EXPORT_COMPILE_COMMANDS=ON -DGGML_NUMA_MIRROR=ON
2929
cmake --build build --parallel $(nproc)
3030

3131
# Debug build
32-
cmake -B build -DCMAKE_BUILD_TYPE=Debug -DCMAKE_EXPORT_COMPILE_COMMANDS=ON
32+
cmake -B build -DCMAKE_BUILD_TYPE=Debug -DCMAKE_EXPORT_COMPILE_COMMANDS=ON -DGGML_NUMA_MIRROR=ON
3333
cmake --build build --parallel $(nproc)
3434

3535
# Run tests
3636
ctest --test-dir build --output-on-failure
3737
```
3838

39-
### Available VS Code Tasks
40-
41-
- **Ctrl+Shift+P** → "Tasks: Run Task":
42-
- `cmake-configure` - Configure CMake
43-
- `cmake-build` - Build project (default)
44-
- `cmake-release` - Release build
45-
- `cmake-clean` - Clean build directory
46-
- `test-cpu-topology` - Test CPU topology detection
47-
- `check-numa` - Display NUMA hardware info
48-
4939
## 🧠 Key Areas of Focus
5040

5141
### 1. NUMA Memory Management

src/llama-model-loader.cpp

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -927,7 +927,7 @@ void llama_model_loader::get_mapping_range(size_t * first, size_t * last, void *
927927
// Calculate the offset for this file within the unified mapping
928928
size_t file_offset = 0;
929929
for (int i = 0; i < idx; ++i) {
930-
file_offset += files[i]->size;
930+
file_offset += files[i]->size();
931931
}
932932

933933
*first = mapping->size(); // Start with full mapping size
@@ -946,10 +946,10 @@ void llama_model_loader::get_mapping_range(size_t * first, size_t * last, void *
946946

947947
// Adjust first and last to be relative to this file's start
948948
if (*first != mapping->size()) {
949-
*first = std::min(*first, files[idx]->size);
949+
*first = std::min(*first, files[idx]->size());
950950
}
951951
if (*last != 0) {
952-
*last = std::min(*last, files[idx]->size);
952+
*last = std::min(*last, files[idx]->size());
953953
}
954954
} else {
955955
#endif
@@ -984,7 +984,7 @@ void llama_model_loader::load_data_for(struct ggml_tensor * cur) const {
984984
// For unified mapping, calculate offset within the unified mapping
985985
size_t unified_offset = w.offs;
986986
for (int i = 0; i < w.idx; ++i) {
987-
unified_offset += files[i]->size;
987+
unified_offset += files[i]->size();
988988
}
989989

990990
const auto & mapping = mappings[0];

0 commit comments

Comments
 (0)