File tree
6 files changed
+9
-9
lines changed- examples
- embeddings
- simple
- llama-cpp-2
- llama-cpp-sys-2
6 files changed
+9
-9
lines changedLines changed: 4 additions & 4 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.
Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
1 | 1 |
| |
2 | 2 |
| |
3 |
| - | |
| 3 | + | |
4 | 4 |
| |
5 | 5 |
| |
6 | 6 |
| |
|
Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
1 | 1 |
| |
2 | 2 |
| |
3 |
| - | |
| 3 | + | |
4 | 4 |
| |
5 | 5 |
| |
6 | 6 |
| |
|
Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
1 | 1 |
| |
2 | 2 |
| |
3 | 3 |
| |
4 |
| - | |
| 4 | + | |
5 | 5 |
| |
6 | 6 |
| |
7 | 7 |
| |
|
Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
1 | 1 |
| |
2 | 2 |
| |
3 | 3 |
| |
4 |
| - | |
| 4 | + | |
5 | 5 |
| |
6 | 6 |
| |
7 | 7 |
| |
|
- .devops/musa.Dockerfile+3-3
- .devops/rocm.Dockerfile+2-2
- .github/workflows/build.yml+1-1
- .github/workflows/close-issue.yml+1-1
- README.md-1
- ci/README.md+1-1
- common/arg.cpp+8-1
- common/common.h+4-3
- convert_hf_to_gguf.py+12-4
- docs/build-s390x.md+38-8
- docs/build.md+3
- docs/development/HOWTO-add-model.md+15-6
- docs/docker.md+1-1
- docs/ops.md+12-4
- docs/ops/CPU.csv+7.3k-6.5k
- docs/ops/CUDA.csv+7.3k-6.5k
- ggml/CMakeLists.txt+3-1
- ggml/cmake/ggml-config.cmake.in+85-47
- ggml/src/ggml-backend.cpp+8-5
- ggml/src/ggml-cann/acl_tensor.cpp+3-1
- ggml/src/ggml-cann/aclnn_ops.cpp+58-3
- ggml/src/ggml-cann/aclnn_ops.h+130-22
- ggml/src/ggml-cann/ggml-cann.cpp+121-16
- ggml/src/ggml-cpu/CMakeLists.txt+5-2
- ggml/src/ggml-cpu/arch/loongarch/quants.c+1-1
- ggml/src/ggml-cpu/kleidiai/kernels.cpp+109-12
- ggml/src/ggml-cpu/kleidiai/kernels.h+3
- ggml/src/ggml-cpu/kleidiai/kleidiai.cpp+88-10
- ggml/src/ggml-cpu/repack.cpp-1
- ggml/src/ggml-cuda/CMakeLists.txt+3-3
- ggml/src/ggml-cuda/common.cuh+14-4
- ggml/src/ggml-cuda/convert.cu+64-17
- ggml/src/ggml-cuda/cpy-utils.cuh+10-36
- ggml/src/ggml-cuda/cpy.cu+40-63
- ggml/src/ggml-cuda/fattn-common.cuh+54-52
- ggml/src/ggml-cuda/fattn-mma-f16.cuh+25-46
- ggml/src/ggml-cuda/fattn-tile-f16.cu+10-31
- ggml/src/ggml-cuda/fattn-tile-f32.cu+25-46
- ggml/src/ggml-cuda/fattn-vec-f16.cuh+27-41
- ggml/src/ggml-cuda/fattn-vec-f32.cuh+18-33
- ggml/src/ggml-cuda/fattn-wmma-f16.cu+9-30
- ggml/src/ggml-cuda/fattn.cu+3-13
- ggml/src/ggml-cuda/ggml-cuda.cu+45-14
- ggml/src/ggml-cuda/im2col.cu+1-1
- ggml/src/ggml-cuda/mma.cuh+111-3
- ggml/src/ggml-cuda/mmq.cu+6-4
- ggml/src/ggml-cuda/mmq.cuh+1.2k-689
- ggml/src/ggml-cuda/norm.cu+92-5
- ggml/src/ggml-cuda/norm.cuh+2
- ggml/src/ggml-cuda/set-rows.cu+5-18
- ggml/src/ggml-cuda/vendors/hip.h+13-1
- ggml/src/ggml-cuda/vendors/musa.h+2-2
- ggml/src/ggml-metal/ggml-metal-impl.h+1
- ggml/src/ggml-metal/ggml-metal.m+23-5
- ggml/src/ggml-metal/ggml-metal.metal+142-40
- ggml/src/ggml-musa/CMakeLists.txt+18-4
- ggml/src/ggml-opencl/CMakeLists.txt+2
- ggml/src/ggml-opencl/ggml-opencl.cpp+294-2
- ggml/src/ggml-opencl/kernels/conv2d.cl+185
- ggml/src/ggml-opencl/kernels/conv2d_f16_f32.cl+176
- ggml/src/ggml-opencl/kernels/im2col_f16.cl+1-1
- ggml/src/ggml-opencl/kernels/im2col_f32.cl+1-1
- ggml/src/ggml-opencl/kernels/rms_norm.cl+79
- ggml/src/ggml-rpc/ggml-rpc.cpp+4-4
- ggml/src/ggml-sycl/ggml-sycl.cpp+1-1
- ggml/src/ggml-sycl/im2col.cpp+1-1
- ggml/src/ggml-sycl/quants.hpp+8-9
- ggml/src/ggml-sycl/vecdotq.hpp+2-6
- ggml/src/ggml-vulkan/ggml-vulkan.cpp+27-6
- ggml/src/ggml-vulkan/vulkan-shaders/im2col.comp+2-4
- ggml/src/ggml-vulkan/vulkan-shaders/rms_norm.comp+8-2
- ggml/src/ggml-vulkan/vulkan-shaders/vulkan-shaders-gen.cpp+1
- ggml/src/ggml.c+4-6
- gguf-py/gguf/metadata.py+4
- include/llama.h+2
- scripts/create_ops_docs.py+5
- scripts/sync-ggml.last+1-1
- src/llama-arch.cpp+6-6
- src/llama-chat.cpp+3-4
- src/llama-context.cpp+49-14
- src/llama-context.h+13
- src/llama-hparams.h+1-1
- src/llama-memory-recurrent.cpp+15
- src/llama-model.cpp+28-10
- tests/test-backend-ops.cpp+79-26
- tools/export-lora/export-lora.cpp+1-1
- tools/imatrix/README.md+72-14
- tools/imatrix/imatrix.cpp+256-5
- tools/main/main.cpp+10-7
- tools/mtmd/clip.cpp+15-6
- tools/server/server.cpp+5
0 commit comments