1 file changed
+1
-1
lines changed- convert_hf_to_gguf.py+118-6
- docs/backend/SYCL.md+1-1
- docs/build-s390x.md+102-13
- docs/build.md+4
- ggml/CMakeLists.txt+1
- ggml/include/ggml-cpu.h+1
- ggml/src/ggml-cpu/CMakeLists.txt+8
- ggml/src/ggml-cpu/amx/mmq.cpp+10-9
- ggml/src/ggml-cpu/arch/arm/quants.c+109-108
- ggml/src/ggml-cpu/arch/arm/repack.cpp+13-12
- ggml/src/ggml-cpu/arch/loongarch/quants.c+53-52
- ggml/src/ggml-cpu/arch/powerpc/quants.c+56-55
- ggml/src/ggml-cpu/arch/riscv/quants.c+42-41
- ggml/src/ggml-cpu/arch/riscv/repack.cpp+24-23
- ggml/src/ggml-cpu/arch/s390/quants.c+29-28
- ggml/src/ggml-cpu/arch/wasm/quants.c+30-29
- ggml/src/ggml-cpu/arch/x86/quants.c+83-82
- ggml/src/ggml-cpu/arch/x86/repack.cpp+20-19
- ggml/src/ggml-cpu/common.h+3-2
- ggml/src/ggml-cpu/ggml-cpu-impl.h+9-3
- ggml/src/ggml-cpu/ggml-cpu.c+59-16
- ggml/src/ggml-cpu/ggml-cpu.cpp+3
- ggml/src/ggml-cpu/llamafile/sgemm.cpp+3-2
- ggml/src/ggml-cpu/ops.cpp+48-48
- ggml/src/ggml-cpu/quants.c+25-24
- ggml/src/ggml-cpu/repack.cpp+15-14
- ggml/src/ggml-cpu/simd-mappings.h+211-33
- ggml/src/ggml-cpu/vec.cpp+2-2
- ggml/src/ggml-cpu/vec.h+45-45
- ggml/src/ggml-cuda/common.cuh+13-12
- ggml/src/ggml-cuda/fattn-wmma-f16.cu+4
- ggml/src/ggml-cuda/ggml-cuda.cu+15-10
- ggml/src/ggml-impl.h+61-183
- ggml/src/ggml-metal/ggml-metal.m+59-9
- ggml/src/ggml-metal/ggml-metal.metal+72-3
- ggml/src/ggml-musa/mudnn.cuh+2-2
- ggml/src/ggml-opencl/ggml-opencl.cpp+240-535
- ggml/src/ggml-sycl/common.hpp+1-24
- ggml/src/ggml-sycl/ggml-sycl.cpp+2-4
- ggml/src/ggml-sycl/sycl_hw.cpp+3-1
- ggml/src/ggml-sycl/sycl_hw.hpp+3
- ggml/src/ggml-vulkan/CMakeLists.txt+11-1
- ggml/src/ggml.c-11
- ggml/src/gguf.cpp+5-1
- gguf-py/gguf/constants.py+75
- gguf-py/gguf/gguf_writer.py+18
- gguf-py/gguf/tensor_mapping.py+64
- src/llama-arch.cpp+54
- src/llama-arch.h+17
- src/llama-graph.cpp+19-4
- src/llama-graph.h+14-2
- src/llama-hparams.h+6
- src/llama-kv-cache-unified.cpp+28-2
- src/llama-model.cpp+518-1
- src/llama-model.h+22
- src/llama-quant.cpp+8-1
- tests/test-backend-ops.cpp+39-33
0 commit comments