Commit 4b66c45
authored
feat: update llama.cpp to 210a6570c (abetlen#2242)
1 parent: a9b480f · commit: 4b66c45
3 files changed
Lines changed: 6 additions & 1 deletion
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| | | | |
| 7 | 7 | | |
| 8 | 8 | | |
| 9 | 9 | | |
| | 10 | + | |
| 10 | 11 | | |
| 11 | 12 | | |
| 12 | 13 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| | | | |
| 903 | 903 | | |
| 904 | 904 | | |
| 905 | 905 | | |
| | 906 | + | |
| 906 | 907 | | |
| 907 | 908 | | |
| 908 | 909 | | |
| | | | |
| 958 | 959 | | |
| 959 | 960 | | |
| 960 | 961 | | |
| | 962 | + | |
| 961 | 963 | | |
| 962 | 964 | | |
| 963 | 965 | | |
| | | | |
| 995 | 997 | | |
| 996 | 998 | | |
| 997 | 999 | | |
| | 1000 | + | |
| 998 | 1001 | | |
| 999 | 1002 | | |
| 1000 | 1003 | | |
| | | | |
| 1031 | 1034 | | |
| 1032 | 1035 | | |
| 1033 | 1036 | | |
| | 1037 | + | |
| 1034 | 1038 | | |
| 1035 | 1039 | | |
| 1036 | 1040 | | |
| |||
- .devops/nix/package.nix (+28 -1)
- .github/workflows/build-self-hosted.yml (+1 -1)
- .github/workflows/server.yml (-3)
- SECURITY.md (+5 -5)
- common/arg.cpp (-4)
- common/common.cpp (+1)
- common/common.h (+1)
- common/reasoning-budget.cpp (+21)
- common/reasoning-budget.h (+4)
- common/sampling.cpp (+8)
- common/sampling.h (+3)
- common/speculative.cpp (+34 -12)
- common/speculative.h (+3)
- conversion/__init__.py (+2)
- conversion/base.py (+1 -1)
- conversion/exaone.py (+97 -2)
- docs/backend/SYCL.md (+1 -1)
- docs/ops.md (+1 -1)
- docs/ops/SYCL.csv (+2.0k -1.6k)
- ggml/include/ggml-backend.h (+7 -3)
- ggml/src/ggml-backend-meta.cpp (+142 -136)
- ggml/src/ggml-metal/ggml-metal-device.m (+1 -1)
- ggml/src/ggml-metal/ggml-metal.metal (+66 -30)
- ggml/src/ggml-opencl/CMakeLists.txt (+6)
- ggml/src/ggml-opencl/ggml-opencl.cpp (+429 -13)
- ggml/src/ggml-opencl/kernels/cvt.cl (+100)
- ggml/src/ggml-opencl/kernels/mul_mm_q5_0_f32_l4_lm.cl (+173)
- ggml/src/ggml-opencl/kernels/mul_mm_q5_1_f32_l4_lm.cl (+175)
- ggml/src/ggml-opencl/kernels/mul_mv_q5_0_f32.cl (+241)
- ggml/src/ggml-opencl/kernels/mul_mv_q5_0_f32_flat.cl (+243)
- ggml/src/ggml-opencl/kernels/mul_mv_q5_1_f32.cl (+243)
- ggml/src/ggml-opencl/kernels/mul_mv_q5_1_f32_flat.cl (+247)
- ggml/src/ggml-sycl/common.hpp (+1)
- ggml/src/ggml-sycl/convert.cpp (+23 -2)
- ggml/src/ggml-sycl/dequantize.hpp (+529)
- ggml/src/ggml-sycl/dmmv.cpp (+119 -1)
- ggml/src/ggml-sycl/fattn-common.hpp (+3 -3)
- ggml/src/ggml-sycl/getrows.cpp (+75 -3)
- ggml/src/ggml-sycl/ggml-sycl.cpp (+70)
- ggml/src/ggml-sycl/mmvq.cpp (+29 -1)
- ggml/src/ggml-sycl/quants.hpp (+25)
- ggml/src/ggml-sycl/vecdotq.hpp (+35)
- ggml/src/ggml-vulkan/ggml-vulkan.cpp (+118 -66)
- ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vecq_funcs.glsl (+66 -42)
- ggml/src/ggml-webgpu/wgsl-shaders/cpy.wgsl (+4 -5)
- gguf-py/gguf/constants.py (+8)
- include/llama.h (+1)
- scripts/sync_vendor.py (+1 -1)
- src/llama-context.cpp (+15 -11)
- src/llama-cparams.h (+1)
- src/llama-model.cpp (+23 -20)
- src/llama-vocab.cpp (+9 -6)
- src/models/exaone4.cpp (+35 -12)
- tests/test-reasoning-budget.cpp (+72 -1)
- tools/mtmd/CMakeLists.txt (+1)
- tools/mtmd/clip-impl.h (+2)
- tools/mtmd/clip.cpp (+28 -1)
- tools/mtmd/models/exaone4_5.cpp (+170)
- tools/mtmd/models/models.h (+5)
- tools/mtmd/mtmd.cpp (+7)
- tools/server/server-context.cpp (+23 -4)
- vendor/cpp-httplib/httplib.cpp (+26 -10)
- vendor/cpp-httplib/httplib.h (+2 -2)
0 commit comments