This repository was archived by the owner on Jul 4, 2025. It is now read-only.
1 file changed
+1
-1
lines changed- .gitignore+2
- CONTRIBUTING.md+1-1
- common/arg.cpp+8-3
- common/common.h+1
- convert_hf_to_gguf.py+8-3
- convert_hf_to_gguf_update.py+5
- examples/llava/README-granitevision.md+34-27
- examples/main/main.cpp+26-13
- examples/server/public/index.html.gz
- examples/server/webui/src/components/SettingDialog.tsx+7-7
- ggml/CMakeLists.txt+3
- ggml/include/ggml-alloc.h+1-1
- ggml/include/ggml-backend.h+3-3
- ggml/src/ggml-alloc.c+24-15
- ggml/src/ggml-backend-impl.h+1-1
- ggml/src/ggml-backend.cpp+9-8
- ggml/src/ggml-cann/ggml-cann.cpp+3-2
- ggml/src/ggml-cann/kernels/dup.cpp+3-5
- ggml/src/ggml-cpu/amx/amx.cpp+2-1
- ggml/src/ggml-cpu/ggml-cpu-aarch64.cpp+2-1
- ggml/src/ggml-cpu/ggml-cpu-quants.c+246-1
- ggml/src/ggml-cuda/CMakeLists.txt+9
- ggml/src/ggml-cuda/ggml-cuda.cu+5-3
- ggml/src/ggml-cuda/mmq.cuh+2-2
- ggml/src/ggml-opencl/ggml-opencl.cpp+2-1
- ggml/src/ggml-rpc/ggml-rpc.cpp+2-1
- ggml/src/ggml-sycl/ggml-sycl.cpp+5-3
- ggml/src/ggml-vulkan/ggml-vulkan.cpp+30-28
- ggml/src/ggml-vulkan/vulkan-shaders/dequant_funcs.comp+3-3
- ggml/src/ggml-vulkan/vulkan-shaders/dequant_funcs_cm2.comp+1-1
- ggml/src/ggml-vulkan/vulkan-shaders/get_rows_quant.comp+2
- ggml/src/ggml-vulkan/vulkan-shaders/im2col.comp+31-18
- ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_iq2_s.comp+90
- ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_iq2_xs.comp+87
- ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_iq2_xxs.comp+87
- ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_iq3_s.comp+90
- ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_iq3_xxs.comp+88
- ggml/src/ggml-vulkan/vulkan-shaders/mul_mm.comp+86-52
- ggml/src/ggml-vulkan/vulkan-shaders/types.comp+37-15
- ggml/src/ggml-vulkan/vulkan-shaders/vulkan-shaders-gen.cpp+9-3
- gguf-py/gguf/metadata.py+28-8
- include/llama.h+1
- models/ggml-vocab-gpt-4o.gguf.inp+112
- models/ggml-vocab-gpt-4o.gguf.out+46
- src/llama-model.cpp+8-5
- src/llama-vocab.cpp+11
- tests/test-backend-ops.cpp+61-44
0 commit comments