This repository was archived by the owner on Jul 4, 2025. It is now read-only.
1 file changed
+1
-1
lines changed
- .github/workflows/build.yml+31-5
- Package.swift-19
- README.md+2-2
- Sources/llama/llama.h-4
- Sources/llama/module.modulemap-5
- build-xcframework.sh+519
- common/arg.cpp+9
- common/chat.cpp+300-139
- common/common.cpp+27-1
- common/common.h+19-4
- common/json-schema-to-grammar.cpp+4-5
- common/json-schema-to-grammar.h-1
- common/ngram-cache.cpp+1
- common/sampling.cpp+45-7
- common/speculative.cpp+1
- examples/embedding/embedding.cpp+1
- examples/json_schema_to_grammar.py+1-1
- examples/llama.swiftui/README.md+15
- examples/llama.swiftui/llama.swiftui.xcodeproj/project.pbxproj+20-10
- examples/lookahead/lookahead.cpp+1
- examples/main/main.cpp+41-14
- examples/parallel/parallel.cpp+1
- examples/passkey/passkey.cpp+1
- examples/quantize/quantize.cpp+1
- examples/server/public_legacy/json-schema-to-grammar.mjs+1-1
- examples/server/server.cpp+36-28
- examples/server/tests/unit/test_tool_call.py+136-100
- examples/server/tests/utils.py+18-2
- examples/server/utils.hpp+2-4
- examples/tts/tts.cpp+2-2
- ggml/include/ggml.h+5-1
- ggml/src/ggml-backend-reg.cpp+1
- ggml/src/ggml-backend.cpp+1
- ggml/src/ggml-cpu/ggml-cpu-quants.c+396-396
- ggml/src/ggml-cpu/ggml-cpu.c+13-13
- ggml/src/ggml-metal/ggml-metal.m+24-23
- ggml/src/ggml-quants.c+114-114
- ggml/src/ggml-sycl/ggml-sycl.cpp+10-8
- ggml/src/ggml.c+3-3
- include/llama.h+17-5
- models/templates/README.md+1-1
- requirements.txt+1
- requirements/requirements-all.txt+1
- requirements/requirements-tool_bench.txt+12
- scripts/apple/validate-apps.sh+5
- scripts/apple/validate-ios.sh+820
- scripts/apple/validate-macos.sh+781
- scripts/apple/validate-tvos.sh+813
- scripts/apple/validate-visionos.sh+811
- scripts/fetch_server_test_models.py+1-1
- scripts/tool_bench.py+368
- scripts/tool_bench.sh+66
- spm-headers/ggml-alloc.h-1
- spm-headers/ggml-backend.h-1
- spm-headers/ggml-cpp.h-1
- spm-headers/ggml-cpu.h-1
- spm-headers/ggml-metal.h-1
- spm-headers/ggml.h-1
- spm-headers/llama.h-1
- src/llama-chat.cpp+1
- src/llama-grammar.cpp+22-22
- src/llama-grammar.h+12-3
- src/llama-kv-cache.h+1
- src/llama-mmap.cpp+11-1
- src/llama-sampling.cpp+43-10
- src/llama-vocab.cpp+1
- tests/test-chat.cpp+122-11
- tests/test-json-schema-to-grammar.cpp+63-63
0 commit comments