localcode 0.2.15__tar.gz → 0.2.16__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {localcode-0.2.15/src/localcode.egg-info → localcode-0.2.16}/PKG-INFO +22 -5
- {localcode-0.2.15 → localcode-0.2.16}/README.md +21 -4
- {localcode-0.2.15 → localcode-0.2.16}/pyproject.toml +1 -1
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/__init__.py +1 -1
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/__init__.py +2 -3
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/helpers.py +0 -10
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/sections.py +2 -11
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/app.py +1 -63
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/autonomy.py +0 -15
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/bootstrap.py +6 -15
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/formatting.py +0 -9
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/model_families.py +1 -1
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/models_catalog.py +45 -46
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/patching.py +0 -25
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/plans.py +0 -8
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/process_registry.py +0 -20
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/recommendations.py +1 -1
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/runtime.py +1 -1
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/snapshots.py +0 -18
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/telemetry.py +0 -18
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/theme.py +1 -20
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tool_parsing.py +0 -11
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tool_router.py +0 -60
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/screens/chat.py +22 -10
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/screens/setup.py +7 -7
- localcode-0.2.16/src/localcode/verification.py +87 -0
- {localcode-0.2.15 → localcode-0.2.16/src/localcode.egg-info}/PKG-INFO +22 -5
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_agent_event_regressions.py +0 -24
- localcode-0.2.15/src/localcode/verification.py +0 -197
- {localcode-0.2.15 → localcode-0.2.16}/LICENSE +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/MANIFEST.in +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/CMakePresets.json +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/LICENSE +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/arm64-apple-clang.cmake +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/arm64-windows-llvm.cmake +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/build-info.cmake +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/common.cmake +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/download-models.cmake +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/git-vars.cmake +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/license.cmake +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/llama-config.cmake.in +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/llama.pc.in +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/riscv64-spacemit-linux-gnu-gcc.cmake +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/x64-windows-llvm.cmake +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/arg.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/arg.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/base64.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-auto-parser-generator.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-auto-parser-helpers.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-auto-parser-helpers.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-auto-parser.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-diff-analyzer.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-peg-parser.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-peg-parser.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/common.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/common.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/console.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/console.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/debug.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/debug.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/download.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/download.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/hf-cache.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/hf-cache.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/http.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/caps.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/caps.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/lexer.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/lexer.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/parser.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/parser.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/runtime.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/runtime.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/string.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/string.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/utils.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/value.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/value.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/json-partial.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/json-partial.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/json-schema-to-grammar.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/json-schema-to-grammar.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/llguidance.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/log.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/log.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/ngram-cache.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/ngram-cache.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/ngram-map.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/ngram-map.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/ngram-mod.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/ngram-mod.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/peg-parser.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/peg-parser.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/preset.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/preset.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/reasoning-budget.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/reasoning-budget.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/regex-partial.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/regex-partial.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/sampling.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/sampling.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/speculative.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/speculative.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/unicode.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/unicode.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-alloc.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-backend.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-blas.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-cann.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-cpp.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-cpu.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-cuda.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-hexagon.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-metal.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-opencl.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-openvino.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-opt.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-rpc.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-sycl.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-virtgpu.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-vulkan.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-webgpu.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-zdnn.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-zendnn.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/gguf.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-alloc.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-backend-dl.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-backend-dl.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-backend-impl.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-backend-reg.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-backend.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-blas/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-blas/ggml-blas.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/acl_tensor.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/acl_tensor.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/aclnn_ops.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/aclnn_ops.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/common.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/ggml-cann.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-common.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/amx/amx.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/amx/amx.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/amx/common.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/amx/mmq.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/amx/mmq.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/arm/cpu-feats.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/arm/quants.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/arm/repack.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/loongarch/quants.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/powerpc/cpu-feats.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/powerpc/quants.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/riscv/cpu-feats.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/riscv/quants.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/riscv/repack.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/s390/cpu-feats.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/s390/quants.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/wasm/quants.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/x86/cpu-feats.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/x86/quants.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/x86/repack.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch-fallback.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/binary-ops.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/binary-ops.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/cmake/FindSIMD.cmake +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/common.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/ggml-cpu-impl.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/ggml-cpu.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/ggml-cpu.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/hbm.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/hbm.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/kleidiai/kernels.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/kleidiai/kernels.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/kleidiai/kleidiai.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/kleidiai/kleidiai.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/llamafile/sgemm.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/llamafile/sgemm.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/ops.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/ops.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/quants.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/quants.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/repack.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/repack.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/simd-gemm.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/simd-mappings.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/spacemit/ime.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/spacemit/ime.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/spacemit/ime1_kernels.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/spacemit/ime_kernels.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/traits.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/traits.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/unary-ops.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/unary-ops.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/vec.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/vec.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cuda/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cuda/vendors/cuda.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cuda/vendors/hip.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cuda/vendors/musa.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/ggml-hexagon.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/act-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/argsort-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/binary-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/cmake-toolchain.cmake +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/cpy-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/cumsum-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/flash-attn-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/get-rows-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-dma.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-dma.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-dump.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-fastdiv.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-utils.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hmx-matmul-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hmx-ops.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hmx-profile.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hmx-utils.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/htp-ctx.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/htp-msg.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/htp-ops.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-arith.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-base.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-copy.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-div.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-dump.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-exp.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-floor.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-inverse.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-reduce.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-scale.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-sigmoid.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-sqrt.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-types.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-utils.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/main.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/matmul-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/repeat-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/rope-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/set-rows-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/softmax-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/ssm-conv.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/sum-rows-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/unary-ops.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/worker-pool.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/worker-pool.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp-drv.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp-drv.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/libdl.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/op-desc.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hip/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-impl.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-common.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-common.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-context.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-context.m +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-device.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-device.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-device.m +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-impl.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-ops.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-ops.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal.metal +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/turbo-matrices.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/turbo-wht.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-musa/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-opencl/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-opencl/ggml-opencl.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-decoder.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-decoder.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-openvino-extra.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-openvino-extra.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-openvino.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-quants.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-quants.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/decoder.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/frontend.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/frontend.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/input_model.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/input_model.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/node_context.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/cont.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/cpy.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/flash_attn_ext.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/get_rows.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/glu_geglu.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/glu_swiglu.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/mulmat.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/permute.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/reshape.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/rms_norm.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/rope.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/scale.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/set_rows.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/softmax.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/transpose.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/unary_silu.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/view.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op_table.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op_table.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/eliminate_zp.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/eliminate_zp.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/fuse_to_sdpa.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/fuse_to_sdpa.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/mark_decompression_convert_constant_folding.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/squeeze_matmul.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/squeeze_matmul.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/translate_session.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/translate_session.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/utils.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/utils.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/utils.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/utils.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-opt.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-quants.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-quants.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-rpc/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-rpc/ggml-rpc.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/add-id.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/add-id.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/backend.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/binbcast.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/binbcast.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/common.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/common.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/concat.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/concat.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/conv.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/conv.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/convert.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/convert.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/count-equal.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/count-equal.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/cpy.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/cpy.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/dequantize.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/dmmv.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/dmmv.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/dpct/helper.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/element_wise.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/element_wise.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/fattn-common.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/fattn-tile.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/fattn-tile.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/fattn-vec.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/fattn.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/fattn.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/gated_delta_net.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/gated_delta_net.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/gemm.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/getrows.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/getrows.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/ggml-sycl.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/gla.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/gla.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/im2col.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/im2col.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/mmq.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/mmq.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/mmvq.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/mmvq.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/norm.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/norm.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/outprod.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/outprod.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/pad.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/pad.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/pad_reflect_1d.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/pad_reflect_1d.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/presets.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/quantize.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/quants.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/repeat_back.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/repeat_back.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/roll.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/roll.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/rope.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/rope.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/set.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/set.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/set_rows.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/set_rows.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/softmax.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/softmax.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/ssm_conv.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/ssm_conv.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/sycl_hw.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/sycl_hw.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq112-dv112.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq128-dv128.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq256-dv256.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq40-dv40.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq576-dv512.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq64-dv64.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq72-dv72.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq80-dv80.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq96-dv96.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-f16.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q4_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q4_1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q5_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q5_1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q8_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-f16.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q4_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q4_1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q5_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q5_1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q8_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-f16.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q4_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q4_1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q5_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q5_1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q8_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-f16.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q4_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q4_1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q5_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q5_1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q8_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-f16.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q4_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q4_1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q5_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q5_1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q8_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-f16.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q4_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q4_1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q5_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q5_1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q8_0.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/tsembd.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/tsembd.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/type.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/upscale.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/upscale.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/vecdotq.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/wkv.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/wkv.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-threading.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-threading.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-turbo-quant.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/apir_cs_ggml-rpc-front.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/apir_cs_ggml-rpc-back.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-convert.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched-backend.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched-buffer-type.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched-buffer.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched-device.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched.gen.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-virgl-apir.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/api_remoting.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_backend.gen.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_backend.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_cs.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_cs_ggml.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_cs_rpc.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend-buffer-type.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend-buffer.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend-device.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend-reg.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-remoting.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/include/apir_hw.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-apir.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-backend.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-buffer-type.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-buffer.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-device.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-impl.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward.gen.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-shm.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-shm.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-utils.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-utils.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-vulkan/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-vulkan/ggml-vulkan.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-vulkan/vulkan-shaders/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-vulkan/vulkan-shaders/vulkan-shaders-gen.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-webgpu/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-webgpu/ggml-webgpu-shader-lib.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-webgpu/ggml-webgpu.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-webgpu/pre_wgsl.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/common.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/ggml-zdnn.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/mmf.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/mmf.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/utils.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/utils.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zendnn/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zendnn/ggml-zendnn.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml.c +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/gguf.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/include/llama-cpp.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/include/llama.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/licenses/LICENSE-jsonhpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-adapter.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-adapter.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-arch.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-arch.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-batch.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-batch.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-chat.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-chat.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-context.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-context.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-cparams.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-cparams.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-ext.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-grammar.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-grammar.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-graph.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-graph.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-hparams.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-hparams.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-impl.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-impl.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-io.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-io.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-kv-cache-iswa.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-kv-cache-iswa.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-kv-cache.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-kv-cache.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-kv-cells.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory-hybrid-iswa.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory-hybrid-iswa.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory-hybrid.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory-hybrid.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory-recurrent.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory-recurrent.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-mmap.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-mmap.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-model-loader.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-model-loader.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-model-saver.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-model-saver.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-model.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-model.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-quant.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-quant.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-sampler.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-sampler.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-vocab.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-vocab.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/afmoe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/apertus.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/arcee.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/arctic.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/arwkv7.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/baichuan.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/bailingmoe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/bailingmoe2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/bert.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/bitnet.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/bloom.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/chameleon.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/chatglm.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/codeshell.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/cogvlm.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/cohere2-iswa.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/command-r.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/dbrx.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/deci.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/deepseek.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/deepseek2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/delta-net-base.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/dots1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/dream.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/ernie4-5-moe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/ernie4-5.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/eurobert.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/exaone-moe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/exaone.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/exaone4.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/falcon-h1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/falcon.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gemma-embedding.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gemma.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gemma2-iswa.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gemma3.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gemma3n-iswa.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gemma4-iswa.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/glm4-moe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/glm4.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gpt2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gptneox.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/granite-hybrid.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/granite.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/grok.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/grovemoe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/hunyuan-dense.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/hunyuan-moe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/internlm2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/jais.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/jais2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/jamba.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/kimi-linear.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/lfm2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/llada-moe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/llada.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/llama-iswa.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/llama.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/maincoder.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/mamba-base.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/mamba.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/mimo2-iswa.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/minicpm3.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/minimax-m2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/mistral3.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/models.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/modern-bert.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/mpt.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/nemotron-h.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/nemotron.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/neo-bert.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/olmo.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/olmo2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/olmoe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/openai-moe-iswa.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/openelm.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/orion.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/paddleocr.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/pangu-embedded.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/phi2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/phi3.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/plamo.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/plamo2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/plamo3.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/plm.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen2moe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen2vl.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen3.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen35.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen35moe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen3moe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen3next.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen3vl-moe.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen3vl.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/refact.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/rnd1.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/rwkv6-base.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/rwkv6.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/rwkv6qwen2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/rwkv7-base.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/rwkv7.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/seed-oss.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/smallthinker.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/smollm3.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/stablelm.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/starcoder.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/starcoder2.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/step35-iswa.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/t5-dec.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/t5-enc.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/wavtokenizer-dec.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/xverse.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/turbo-rotation-data-32.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/turbo-rotation-data.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/unicode-data.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/unicode-data.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/unicode.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/unicode.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/batched-bench/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/batched-bench/batched-bench.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/cli/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/cli/cli.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/completion/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/completion/completion.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/cvector-generator/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/cvector-generator/cvector-generator.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/cvector-generator/mean.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/cvector-generator/pca.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/export-lora/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/export-lora/export-lora.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/fit-params/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/fit-params/fit-params.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/gguf-split/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/gguf-split/gguf-split.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/imatrix/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/imatrix/imatrix.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/llama-bench/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/llama-bench/llama-bench.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/clip-graph.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/clip-impl.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/clip-model.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/clip.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/clip.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/debug/mtmd-debug.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/debug/mtmd-debug.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/deprecation-warning.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/cogvlm.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/conformer.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/deepseekocr.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/gemma4v.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/glm4v.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/hunyuanocr.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/internvl.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/kimik25.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/kimivl.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/llama4.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/llava.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/minicpmv.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/mobilenetv5.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/models.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/nemotron-v2-vl.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/paddleocr.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/pixtral.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/qwen2vl.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/qwen3vl.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/siglip.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/whisper-enc.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/youtuvl.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-audio.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-audio.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-cli.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-helper.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-helper.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-image.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-image.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/parser/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/parser/debug-template-parser.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/parser/template-analysis.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/perplexity/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/perplexity/perplexity.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/quantize/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/quantize/quantize.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/results/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/results/results.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/rpc/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/rpc/rpc-server.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-common.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-common.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-context.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-context.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-cors-proxy.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-http.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-http.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-models.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-models.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-queue.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-queue.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-task.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-task.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-tools.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-tools.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/tokenize/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/tokenize/tokenize.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/tts/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/tts/tts.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/cpp-httplib/CMakeLists.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/cpp-httplib/httplib.cpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/cpp-httplib/httplib.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/miniaudio/miniaudio.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/nlohmann/json.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/nlohmann/json_fwd.hpp +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/sheredom/subprocess.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/stb/stb_image.h +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/setup.cfg +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/setup.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/__main__.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/_subproc_env.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/app_tasks.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/constants.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/context.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/goal.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/hooks.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/loop.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/prompt_context.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/prompts.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/recovery.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/streaming.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/tool_execution.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/tool_orchestration.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/turn_finalization.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/approvals.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/auto_compact.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/bin/__init__.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/bin/llama-server +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/cache.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/checkpoint.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/compact.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/compaction.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/composer.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/config.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/context.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/display.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/embeddings.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/entrypoint.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/errors.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/events.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/features.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/headless_json.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/health.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/hf_quants.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/history.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/hooks.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/indexer.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/injection_defense.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/launcher.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/logging_utils.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/lsp.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/mcp.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/memory_guard.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/model_config.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/models.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/notebook.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/output.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/paths.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/performance.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/permissions.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/permissions_v2.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/recovery.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/runtime_diffusion.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/server_manager.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/session.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/shell.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/debug.md +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/edit-verified.md +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/explain.md +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/git-commit-safely.md +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/locate.md +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/plan-task.md +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/review.md +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/run-tests.md +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/sounds.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/thermal.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/thinking.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/toolkit.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/__init__.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/agent.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/append_file.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/base.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/bash.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/edit_diff.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/edit_file.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/facts.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/glob_tool.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/grep.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/launch_app.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/list_files.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/multi_edit.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/plan_mode.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/read_file.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/skill_tool.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/web_fetch.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/web_search.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/write_file.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/__init__.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/app.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/bridge.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/screens/__init__.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/screens/mode_picker.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/screens/model_picker.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/styles/__init__.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/styles/app.tcss +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/widgets/__init__.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/widgets/approval.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/widgets/chat_log.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/widgets/messages/__init__.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/widgets/messages/diff.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/widgets/voice_visualizer.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/turn_diff.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/undo.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode/voice.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode.egg-info/SOURCES.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode.egg-info/dependency_links.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode.egg-info/entry_points.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode.egg-info/requires.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/src/localcode.egg-info/top_level.txt +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_architecture.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_bootstrap.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_checkpoint.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_churn_detection.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_compaction.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_agent.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_bg_download.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_binary.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_cli.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_diffusion.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_download.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_hardening.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_install.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_machines.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_model_picker.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_models_matrix.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_tui.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_vision.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_voice.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_whisper.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_config.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_context.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_context_pipeline_e2e.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_download.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_embeddings_retrieval.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_fresh_install.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_kv_cap.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_model_config.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_models_catalog.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_output.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_prompt_language_steering.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_real_models.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_run_json.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_runtime.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_subproc_env.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_thermal.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_toolkit.py +0 -0
- {localcode-0.2.15 → localcode-0.2.16}/tests/test_tui_input.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: localcode
|
|
3
|
-
Version: 0.2.15
|
|
3
|
+
Version: 0.2.16
|
|
4
4
|
Summary: High-performance AI coding on consumer hardware.
|
|
5
5
|
Author: LocalCode contributors
|
|
6
6
|
License-Expression: Apache-2.0
|
|
@@ -54,7 +54,7 @@ Dynamic: license-file
|
|
|
54
54
|
<p align="center">
|
|
55
55
|
<img src="https://img.shields.io/pypi/v/localcode?style=flat-square&color=7c4dff" alt="PyPI">
|
|
56
56
|
<img src="https://img.shields.io/badge/license-Apache_2.0-4caf50?style=flat-square" alt="License">
|
|
57
|
-
<img src="https://img.shields.io/badge/python-3.
|
|
57
|
+
<img src="https://img.shields.io/badge/python-3.9+-3776ab?style=flat-square" alt="Python">
|
|
58
58
|
<img src="https://img.shields.io/badge/platform-Apple%20Silicon-999999?style=flat-square" alt="Platform">
|
|
59
59
|
</p>
|
|
60
60
|
|
|
@@ -108,7 +108,7 @@ We are building for a world of truly democratized AI — where everyone has acce
|
|
|
108
108
|
|
|
109
109
|
- **Mac with Apple Silicon**
|
|
110
110
|
- **16 GB RAM** minimum
|
|
111
|
-
- **Python 3.
|
|
111
|
+
- **Python 3.9+**
|
|
112
112
|
- **~12 GB free disk** (10 GB model + server)
|
|
113
113
|
|
|
114
114
|
### Tested hardware
|
|
@@ -122,18 +122,35 @@ LocalCode is early software. Hardware support is expected to broaden, but only t
|
|
|
122
122
|
| M4 Apple Silicon | 24 GB+ | Not yet tested | Expected to support larger contexts, but needs validation |
|
|
123
123
|
| Intel Mac | Any | Not supported | LocalCode targets Apple Silicon |
|
|
124
124
|
|
|
125
|
+
## Models
|
|
126
|
+
|
|
127
|
+
On launch, LocalCode recommends the best model for **your Mac's RAM** — there's no fixed default. You can pick any of these (or a different quant) in the model picker.
|
|
128
|
+
|
|
129
|
+
| Model | Size (quant) | Active params | Min RAM | Architecture |
|
|
130
|
+
| --- | ---: | --- | ---: | --- |
|
|
131
|
+
| Gemma 4 12B | 7.4 GB (Q4) | 12B (dense) | 16 GB | gemma4-iswa |
|
|
132
|
+
| Gemma 4 26B-A4B | 11.2 GB (Q3) | 3.8B (8/128 experts) | 24 GB | gemma4-iswa |
|
|
133
|
+
| Qwen 3.6 35B-A3B | 10.7 GB (Q2) | 3.0B (8+1/256) | 24 GB | qwen35moe |
|
|
134
|
+
| DiffusionGemma 26B-A4B † | 15.7 GB (Q4) | 4B (diffusion MoE) | 32 GB | diffusion_gemma |
|
|
135
|
+
| North-Mini-Code 30B-A3B † | 17.9 GB (Q4) | 3B (30B MoE) | 36 GB | cohere2_moe |
|
|
136
|
+
| Gemma 4 12B (full) | 23.8 GB (BF16) | 12B (dense) | 48 GB | gemma4-iswa |
|
|
137
|
+
| Gemma 4 26B-A4B | 28 GB (Q8) | 3.8B (8/128 experts) | 64 GB | gemma4-iswa |
|
|
138
|
+
| Qwen 3.6 35B-A3B | 38.5 GB (Q8) | 3.0B (8+1/256) | 96 GB | qwen35moe |
|
|
139
|
+
|
|
140
|
+
*Min RAM* is the threshold for auto-recommendation (weights ≤ ~55% of unified memory, leaving room for KV cache + OS); you can still pick a heavier model manually. **†** experimental — pickable but **not** auto-recommended (DiffusionGemma needs a separate runner; `cohere2_moe` is unvalidated on this stack).
|
|
141
|
+
|
|
125
142
|
## How LocalCode works
|
|
126
143
|
|
|
127
144
|
LocalCode runs a custom [llama.cpp](https://github.com/ggerganov/llama.cpp) fork with **TurboQuant KV cache compression** — a technique from Google's ICLR 2026 paper that we patched into llama.cpp for Apple Silicon. This compresses the KV cache 3.8× — fitting 32K context in 355 MiB on a 16 GB MacBook.
|
|
128
145
|
|
|
129
|
-
|
|
146
|
+
LocalCode picks a model based on **your Mac's RAM** — there's no fixed default. It scales from Gemma 4 12B on 16 GB up to Qwen 3.6 35B-A3B on 64 GB+. Most of the recommended models are Mixture-of-Experts — only ~3–4 B parameters active per token — which is what makes ~27 tok/s possible on a laptop.
|
|
130
147
|
|
|
131
148
|
Under the hood:
|
|
132
149
|
|
|
133
150
|
- **TurboQuant KV cache** — asymmetric q8\_0-K + turbo4-V quantization, 3.8× compression vs. f16
|
|
134
151
|
- **Multi-region mmap patch** — fixes a Metal OOM crash where llama.cpp's loader spanned the entire GGUF file into one Metal buffer
|
|
135
152
|
- **GPU memory unlock** — auto-prompts to raise `iogpu.wired_limit_mb` for full Metal offload
|
|
136
|
-
- **Agent loop** —
|
|
153
|
+
- **Agent loop** — goal-typed routing (build / edit / run / chat) with task state, evidence-driven completion, and recovery modes for small-model failure patterns
|
|
137
154
|
|
|
138
155
|
## Sponsors
|
|
139
156
|
|
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
<p align="center">
|
|
10
10
|
<img src="https://img.shields.io/pypi/v/localcode?style=flat-square&color=7c4dff" alt="PyPI">
|
|
11
11
|
<img src="https://img.shields.io/badge/license-Apache_2.0-4caf50?style=flat-square" alt="License">
|
|
12
|
-
<img src="https://img.shields.io/badge/python-3.
|
|
12
|
+
<img src="https://img.shields.io/badge/python-3.9+-3776ab?style=flat-square" alt="Python">
|
|
13
13
|
<img src="https://img.shields.io/badge/platform-Apple%20Silicon-999999?style=flat-square" alt="Platform">
|
|
14
14
|
</p>
|
|
15
15
|
|
|
@@ -63,7 +63,7 @@ We are building for a world of truly democratized AI — where everyone has acce
|
|
|
63
63
|
|
|
64
64
|
- **Mac with Apple Silicon**
|
|
65
65
|
- **16 GB RAM** minimum
|
|
66
|
-
- **Python 3.
|
|
66
|
+
- **Python 3.9+**
|
|
67
67
|
- **~12 GB free disk** (10 GB model + server)
|
|
68
68
|
|
|
69
69
|
### Tested hardware
|
|
@@ -77,18 +77,35 @@ LocalCode is early software. Hardware support is expected to broaden, but only t
|
|
|
77
77
|
| M4 Apple Silicon | 24 GB+ | Not yet tested | Expected to support larger contexts, but needs validation |
|
|
78
78
|
| Intel Mac | Any | Not supported | LocalCode targets Apple Silicon |
|
|
79
79
|
|
|
80
|
+
## Models
|
|
81
|
+
|
|
82
|
+
On launch, LocalCode recommends the best model for **your Mac's RAM** — there's no fixed default. You can pick any of these (or a different quant) in the model picker.
|
|
83
|
+
|
|
84
|
+
| Model | Size (quant) | Active params | Min RAM | Architecture |
|
|
85
|
+
| --- | ---: | --- | ---: | --- |
|
|
86
|
+
| Gemma 4 12B | 7.4 GB (Q4) | 12B (dense) | 16 GB | gemma4-iswa |
|
|
87
|
+
| Gemma 4 26B-A4B | 11.2 GB (Q3) | 3.8B (8/128 experts) | 24 GB | gemma4-iswa |
|
|
88
|
+
| Qwen 3.6 35B-A3B | 10.7 GB (Q2) | 3.0B (8+1/256) | 24 GB | qwen35moe |
|
|
89
|
+
| DiffusionGemma 26B-A4B † | 15.7 GB (Q4) | 4B (diffusion MoE) | 32 GB | diffusion_gemma |
|
|
90
|
+
| North-Mini-Code 30B-A3B † | 17.9 GB (Q4) | 3B (30B MoE) | 36 GB | cohere2_moe |
|
|
91
|
+
| Gemma 4 12B (full) | 23.8 GB (BF16) | 12B (dense) | 48 GB | gemma4-iswa |
|
|
92
|
+
| Gemma 4 26B-A4B | 28 GB (Q8) | 3.8B (8/128 experts) | 64 GB | gemma4-iswa |
|
|
93
|
+
| Qwen 3.6 35B-A3B | 38.5 GB (Q8) | 3.0B (8+1/256) | 96 GB | qwen35moe |
|
|
94
|
+
|
|
95
|
+
*Min RAM* is the threshold for auto-recommendation (weights ≤ ~55% of unified memory, leaving room for KV cache + OS); you can still pick a heavier model manually. **†** experimental — pickable but **not** auto-recommended (DiffusionGemma needs a separate runner; `cohere2_moe` is unvalidated on this stack).
|
|
96
|
+
|
|
80
97
|
## How LocalCode works
|
|
81
98
|
|
|
82
99
|
LocalCode runs a custom [llama.cpp](https://github.com/ggerganov/llama.cpp) fork with **TurboQuant KV cache compression** — a technique from Google's ICLR 2026 paper that we patched into llama.cpp for Apple Silicon. This compresses the KV cache 3.8× — fitting 32K context in 355 MiB on a 16 GB MacBook.
|
|
83
100
|
|
|
84
|
-
|
|
101
|
+
LocalCode picks a model based on **your Mac's RAM** — there's no fixed default. It scales from Gemma 4 12B (Q4) on 16 GB up to Qwen 3.6 35B-A3B (Q8) on 96 GB+. Apart from the dense 12B entry tier, the recommended models are Mixture-of-Experts — only ~3–4 B parameters active per token — which is what makes ~27 tok/s possible on a laptop.
|
|
85
102
|
|
|
86
103
|
Under the hood:
|
|
87
104
|
|
|
88
105
|
- **TurboQuant KV cache** — asymmetric q8\_0-K + turbo4-V quantization, 3.8× compression vs. f16
|
|
89
106
|
- **Multi-region mmap patch** — fixes a Metal OOM crash where llama.cpp's loader spanned the entire GGUF file into one Metal buffer
|
|
90
107
|
- **GPU memory unlock** — auto-prompts to raise `iogpu.wired_limit_mb` for full Metal offload
|
|
91
|
-
- **Agent loop** —
|
|
108
|
+
- **Agent loop** — goal-typed routing (build / edit / run / chat) with task state, evidence-driven completion, and recovery modes for small-model failure patterns
|
|
92
109
|
|
|
93
110
|
## Sponsors
|
|
94
111
|
|
|
@@ -16,7 +16,7 @@ re-exported here so external callers can continue to import from
|
|
|
16
16
|
Background: before T0.1, agent.py was a 1792-line monolith. The split
|
|
17
17
|
broke it into focused modules (each ≤ ~720 LoC), with __init__.py
|
|
18
18
|
reduced to this re-export surface — well under the 400-LoC cap the
|
|
19
|
-
plan sets for god modules (see eval/OPTIMIZATION_PLAN.md § T0).
|
|
19
|
+
plan sets for god modules (see dev/eval/OPTIMIZATION_PLAN.md § T0).
|
|
20
20
|
|
|
21
21
|
Unused-import warnings in this file are expected — every imported
|
|
22
22
|
name is intentionally re-exported. The `# noqa: F401` comments
|
|
@@ -140,7 +140,7 @@ from .helpers import ( # noqa: F401
|
|
|
140
140
|
|
|
141
141
|
# ── Prompt templates + project-instructions loader ────────────────────────
|
|
142
142
|
# Moved to agent/prompts.py during the T0.1-b split. Re-exported here so
|
|
143
|
-
# external callers (eval/prompt_variants.py, tests/promptfoo, app.py,
|
|
143
|
+
# external callers (dev/eval/prompt_variants.py, tests/promptfoo, app.py,
|
|
144
144
|
# tests/test_context_pipeline_e2e.py) that do
|
|
145
145
|
# `from localcode.agent import SYSTEM_PROMPT`
|
|
146
146
|
# keep working unchanged. See agent/prompts.py for the commented
|
|
@@ -160,7 +160,6 @@ from .prompts import ( # noqa: F401 — re-exports for back-compat
|
|
|
160
160
|
# and the dispatcher (for _execute_tool). Plan-mode gating still lives
|
|
161
161
|
# here because it's cross-tool policy, not tool-specific logic.
|
|
162
162
|
|
|
163
|
-
from ..tools import ALL_SCHEMAS as TOOL_SCHEMAS # for agent-loop tool registry injection
|
|
164
163
|
|
|
165
164
|
|
|
166
165
|
# ── Result Management ────────────────────────────────────────────────────
|
|
@@ -53,16 +53,6 @@ __all__: list[str] = []
|
|
|
53
53
|
_SHRINK_GUARD_SOURCE_EXTS = {".py", ".js", ".jsx", ".ts", ".tsx", ".css", ".html"}
|
|
54
54
|
|
|
55
55
|
|
|
56
|
-
def _canonical_creation_root(app: "LocalCodeApp") -> Path | None:
|
|
57
|
-
task = getattr(getattr(app, "session", None), "current_task", None)
|
|
58
|
-
if getattr(task, "task_kind", "") != "new_app":
|
|
59
|
-
return None
|
|
60
|
-
slug = str(getattr(task, "task_slug", "") or "").strip()
|
|
61
|
-
if not slug:
|
|
62
|
-
return None
|
|
63
|
-
return (app.repo_root / slug).resolve()
|
|
64
|
-
|
|
65
|
-
|
|
66
56
|
def _path_within(path: Path, root: Path) -> bool:
|
|
67
57
|
try:
|
|
68
58
|
path.resolve().relative_to(root)
|
|
@@ -14,14 +14,14 @@ Problems with the monolith:
|
|
|
14
14
|
session, which means every new session re-evaluates the whole
|
|
15
15
|
prompt. Our benchmark shows prompt_ms of ~48 ms warm; the
|
|
16
16
|
theoretical floor with a stable prefix cache is ~5-10 ms.
|
|
17
|
-
• No way to A/B sections individually. `eval/prompt_variants.py`
|
|
17
|
+
• No way to A/B sections individually. `dev/eval/prompt_variants.py`
|
|
18
18
|
only supports coarse "strip rule N" mutations. You can't
|
|
19
19
|
answer "what if we drop the build-app rules for debugging
|
|
20
20
|
tasks?" because there's no boundary between them.
|
|
21
21
|
• No way to gate sections on trigger phrases. Every session ships
|
|
22
22
|
rule 10 (open browser) whether or not a web app is in scope.
|
|
23
23
|
|
|
24
|
-
This module is **Phase 1** of T0.11 (see eval/OPTIMIZATION_PLAN.md):
|
|
24
|
+
This module is **Phase 1** of T0.11 (see dev/eval/OPTIMIZATION_PLAN.md):
|
|
25
25
|
introduce the section-registry concept with behaviour-neutral
|
|
26
26
|
defaults. The composer produces the same output as the old
|
|
27
27
|
`SYSTEM_PROMPT.format(...)` for the default all-sections-on case.
|
|
@@ -55,11 +55,9 @@ work is an add-only operation.
|
|
|
55
55
|
from __future__ import annotations
|
|
56
56
|
|
|
57
57
|
from dataclasses import dataclass
|
|
58
|
-
from pathlib import Path
|
|
59
58
|
from typing import Callable
|
|
60
59
|
|
|
61
60
|
from .prompts import SYSTEM_PROMPT
|
|
62
|
-
from .prompts import _load_project_instructions
|
|
63
61
|
|
|
64
62
|
|
|
65
63
|
__all__ = [
|
|
@@ -241,10 +239,3 @@ def compose_system_prompt(
|
|
|
241
239
|
parts.insert(-1, CACHE_BOUNDARY_MARKER)
|
|
242
240
|
|
|
243
241
|
return "".join(parts)
|
|
244
|
-
|
|
245
|
-
|
|
246
|
-
def load_project_instructions(repo_root: Path) -> str:
|
|
247
|
-
"""Convenience re-export so callers outside agent/ that don't
|
|
248
|
-
want to depend on `agent.prompts` internals can build a
|
|
249
|
-
SectionContext purely from this module."""
|
|
250
|
-
return _load_project_instructions(repo_root)
|
|
@@ -4,7 +4,6 @@ from concurrent.futures import ThreadPoolExecutor, as_completed
|
|
|
4
4
|
from dataclasses import replace
|
|
5
5
|
import logging
|
|
6
6
|
from pathlib import Path
|
|
7
|
-
import re
|
|
8
7
|
|
|
9
8
|
from rich.console import Console
|
|
10
9
|
from rich.panel import Panel
|
|
@@ -41,7 +40,7 @@ from .autonomy import AutonomyLevel, apply_autonomy_to_permissions, get_policy
|
|
|
41
40
|
from .hooks import HookRunner
|
|
42
41
|
from .snapshots import SnapshotStore, create_snapshot
|
|
43
42
|
from .turn_diff import TurnDiffTracker, print_turn_diff
|
|
44
|
-
from .agent.goal import
|
|
43
|
+
from .agent.goal import infer_goal_state
|
|
45
44
|
from .performance import detect_machine_profile, benchmark_report, apply_preset, should_promote_legacy_default_to_laptop_26b
|
|
46
45
|
|
|
47
46
|
|
|
@@ -62,67 +61,6 @@ _FOLLOWUP_CHAT_ONLY = {
|
|
|
62
61
|
_CODING_TASK_KINDS = {"new_app", "existing_app_edit", "run_or_launch"}
|
|
63
62
|
|
|
64
63
|
|
|
65
|
-
def _looks_like_task_followup(user_text: str, current_task: object | None) -> bool:
|
|
66
|
-
"""Return true when a short correction should continue the task.
|
|
67
|
-
|
|
68
|
-
This is deliberately conservative: it only attaches to a coding task
|
|
69
|
-
and only for short correction/addition wording. The actual feature
|
|
70
|
-
remains model/tool-driven; LocalCode does not classify domain terms.
|
|
71
|
-
"""
|
|
72
|
-
if current_task is None:
|
|
73
|
-
return False
|
|
74
|
-
if getattr(current_task, "task_kind", "") not in _CODING_TASK_KINDS:
|
|
75
|
-
return False
|
|
76
|
-
text = (user_text or "").strip().lower()
|
|
77
|
-
if not text:
|
|
78
|
-
return False
|
|
79
|
-
first = next(iter(re.findall(r"[a-z0-9]+", text)), "")
|
|
80
|
-
if text in _FOLLOWUP_CHAT_ONLY:
|
|
81
|
-
return False
|
|
82
|
-
if len(text) <= 80 and "?" not in text and first not in {"what", "why", "how", "where", "when", "who"}:
|
|
83
|
-
return True
|
|
84
|
-
return any(
|
|
85
|
-
phrase in text
|
|
86
|
-
for phrase in (
|
|
87
|
-
"i meant",
|
|
88
|
-
"you forgot",
|
|
89
|
-
"missing",
|
|
90
|
-
"add ",
|
|
91
|
-
"also add",
|
|
92
|
-
"it should",
|
|
93
|
-
"should have",
|
|
94
|
-
"doesn't have",
|
|
95
|
-
"didn't add",
|
|
96
|
-
)
|
|
97
|
-
)
|
|
98
|
-
|
|
99
|
-
|
|
100
|
-
def _continue_goal_for_task_followup(goal_state: GoalState, user_text: str, current_task: object) -> GoalState:
|
|
101
|
-
criteria = list(getattr(current_task, "success_criteria", []) or goal_state.success_criteria)
|
|
102
|
-
criteria.extend([
|
|
103
|
-
"Follow-up correction is implemented in the existing task context",
|
|
104
|
-
"Assistant does not stop with a permission question when the requested implementation is local and feasible",
|
|
105
|
-
])
|
|
106
|
-
current_kind = getattr(current_task, "task_kind", goal_state.task_kind)
|
|
107
|
-
if current_kind in {"new_app", "existing_app_edit"}:
|
|
108
|
-
goal_type = "edit_existing"
|
|
109
|
-
task_kind = "existing_app_edit"
|
|
110
|
-
else:
|
|
111
|
-
goal_type = getattr(current_task, "goal_type", goal_state.goal_type)
|
|
112
|
-
task_kind = current_kind
|
|
113
|
-
# Preserve task identity; this turn is a correction on existing work,
|
|
114
|
-
# not a fresh task name.
|
|
115
|
-
return replace(
|
|
116
|
-
goal_state,
|
|
117
|
-
goal_type=goal_type,
|
|
118
|
-
task_kind=task_kind,
|
|
119
|
-
task_slug=getattr(current_task, "task_slug", goal_state.task_slug),
|
|
120
|
-
goal_summary=f"{getattr(current_task, 'goal_summary', '')}\nFollow-up: {user_text}".strip()[:240],
|
|
121
|
-
success_criteria=tuple(dict.fromkeys(criteria)),
|
|
122
|
-
allows_blocking_question=False,
|
|
123
|
-
)
|
|
124
|
-
|
|
125
|
-
|
|
126
64
|
def _canonical_project_dir_has_files(repo_root: Path, slug: str) -> bool:
|
|
127
65
|
"""True when a creation task's canonical project directory already exists.
|
|
128
66
|
|
|
@@ -101,18 +101,3 @@ def apply_autonomy_to_permissions(permissions, policy: AutonomyPolicy) -> None:
|
|
|
101
101
|
|
|
102
102
|
if policy.level == AutonomyLevel.FULL_AUTO:
|
|
103
103
|
permissions.approve_all()
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
def format_autonomy_status(level: AutonomyLevel) -> str:
|
|
107
|
-
"""Format current autonomy level for display."""
|
|
108
|
-
policy = POLICIES[level]
|
|
109
|
-
icons = {True: "✓", False: "✗"}
|
|
110
|
-
return (
|
|
111
|
-
f"Autonomy: {level.value}\n"
|
|
112
|
-
f" {policy.description}\n"
|
|
113
|
-
f" reads: {icons[policy.auto_approve_reads]}\n"
|
|
114
|
-
f" writes: {icons[policy.auto_approve_writes]}\n"
|
|
115
|
-
f" bash: {icons[policy.auto_approve_bash]}\n"
|
|
116
|
-
f" installs: {icons[policy.auto_approve_installs]}\n"
|
|
117
|
-
f" git: {icons[policy.auto_approve_git]}"
|
|
118
|
-
)
|
|
@@ -539,13 +539,16 @@ def download_model(
|
|
|
539
539
|
) -> tuple[bool, str]:
|
|
540
540
|
"""Download a GGUF model selected from `models_catalog.CHOICES`.
|
|
541
541
|
|
|
542
|
-
If `choice` is None,
|
|
542
|
+
If `choice` is None, falls back to `recommend()` — the RAM-appropriate model
|
|
543
|
+
for this machine, not a hardcoded default.
|
|
543
544
|
Returns (success, path_or_error_message).
|
|
544
545
|
"""
|
|
545
|
-
from .models_catalog import
|
|
546
|
+
from .models_catalog import recommend
|
|
546
547
|
|
|
547
548
|
if choice is None:
|
|
548
|
-
choice
|
|
549
|
+
# No explicit choice → the RAM-appropriate model for THIS machine,
|
|
550
|
+
# not a hardcoded default.
|
|
551
|
+
choice = recommend()
|
|
549
552
|
|
|
550
553
|
# Already present?
|
|
551
554
|
existing = get_model_path(choice.filename)
|
|
@@ -1247,18 +1250,6 @@ def _ensure_ollama() -> bool:
|
|
|
1247
1250
|
return result.returncode == 0
|
|
1248
1251
|
|
|
1249
1252
|
|
|
1250
|
-
def ensure_model_downloaded(model_tag: str, on_progress: Callable[[str], None] | None = None) -> tuple[bool, str]:
|
|
1251
|
-
"""Ensure the model is downloaded via Ollama. Installs Ollama if needed."""
|
|
1252
|
-
if not _ensure_ollama():
|
|
1253
|
-
return False, "Could not install Ollama. Install manually: https://ollama.com/download"
|
|
1254
|
-
# Start Ollama service if not running
|
|
1255
|
-
if platform.system().lower() == "darwin":
|
|
1256
|
-
subprocess.Popen(["ollama", "serve"], stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL,
|
|
1257
|
-
start_new_session=True)
|
|
1258
|
-
import time; time.sleep(2)
|
|
1259
|
-
return pull_model(model_tag, on_progress=on_progress)
|
|
1260
|
-
|
|
1261
|
-
|
|
1262
1253
|
def build_turboquant(on_progress: Callable[[str], None] | None = None) -> tuple[bool, str]:
|
|
1263
1254
|
"""Build the TurboQuant llama.cpp fork from source with Metal support."""
|
|
1264
1255
|
source = _find_turboquant_source()
|
|
@@ -56,15 +56,6 @@ def truncate_with_tail(
|
|
|
56
56
|
return "\n".join(head_block + [ellipsis] + tail_block)
|
|
57
57
|
|
|
58
58
|
|
|
59
|
-
def truncate_one_line(text: str, max_chars: int = 80) -> str:
|
|
60
|
-
"""Truncate to a single line for inline display (e.g. tool-call
|
|
61
|
-
args summary). Replaces newlines with spaces, hard-caps length."""
|
|
62
|
-
s = (text or "").replace("\n", " ").strip()
|
|
63
|
-
if len(s) <= max_chars:
|
|
64
|
-
return s
|
|
65
|
-
return s[: max_chars - 1] + "…"
|
|
66
|
-
|
|
67
|
-
|
|
68
59
|
def split_stdout_stderr(text: str) -> tuple[str, str]:
|
|
69
60
|
"""Heuristic split of bash output into (stdout, stderr).
|
|
70
61
|
|
|
@@ -31,7 +31,7 @@ Scope we DO NOT cover here:
|
|
|
31
31
|
override yet).
|
|
32
32
|
- Prompt rendering differences — the SYSTEM_PROMPT content itself
|
|
33
33
|
is still one string, and word-level per-family variants would live
|
|
34
|
-
in eval/prompt_variants.py, not here.
|
|
34
|
+
in dev/eval/prompt_variants.py, not here.
|
|
35
35
|
"""
|
|
36
36
|
from __future__ import annotations
|
|
37
37
|
|
|
@@ -319,25 +319,57 @@ def _system_ram_gb() -> int:
|
|
|
319
319
|
return 16
|
|
320
320
|
|
|
321
321
|
|
|
322
|
+
# Architectures we never AUTO-recommend (users can still pick them explicitly in
|
|
323
|
+
# the model picker): diffusion needs a separate one-shot runner — not the
|
|
324
|
+
# standard llama-server — and cohere2_moe is unvalidated on this stack.
|
|
325
|
+
_NO_AUTO_RECOMMEND_ARCHS = {"diffusion_gemma", "cohere2_moe"}
|
|
326
|
+
|
|
327
|
+
# Capability order for auto-recommend, best → worst for coding-agent use. This
|
|
328
|
+
# is deliberately NOT raw file size: the big MoEs measure ~95% HumanEval here
|
|
329
|
+
# (even at low bit) and must outrank the 12B dense, and a higher-bit quant of a
|
|
330
|
+
# family wins. A 12B-BF16 must never be recommended over a 26B/35B MoE just
|
|
331
|
+
# because its file happens to be larger.
|
|
332
|
+
_RECOMMEND_ORDER = [
|
|
333
|
+
"qwen-q8", # 35B-A3B MoE, near-lossless Q8
|
|
334
|
+
"gemma-q8", # 26B-A4B MoE, near-lossless Q8
|
|
335
|
+
"qwen", # 35B-A3B MoE Q2 — 94.7% HumanEval
|
|
336
|
+
"gemma", # 26B-A4B MoE Q3 — 95.1% HumanEval
|
|
337
|
+
"gemma-12b-bf16", # 12B dense, full precision
|
|
338
|
+
"gemma-12b", # 12B dense Q4
|
|
339
|
+
]
|
|
340
|
+
|
|
341
|
+
|
|
342
|
+
def _capability_rank(choice) -> int:
|
|
343
|
+
"""Lower = more capable. Curated models first; any other production model
|
|
344
|
+
sorts after them — so a newly-added quant is still recommendable, but never
|
|
345
|
+
outranks a curated MoE."""
|
|
346
|
+
order = {k: i for i, k in enumerate(_RECOMMEND_ORDER)}
|
|
347
|
+
return order.get(choice.key, len(_RECOMMEND_ORDER) + 1)
|
|
348
|
+
|
|
349
|
+
|
|
322
350
|
def recommend(ram_gb: int | None = None) -> ModelChoice:
|
|
323
|
-
"""Pick the
|
|
351
|
+
"""Pick the best model for THIS machine's RAM — capability-ranked, never an
|
|
352
|
+
experimental architecture, and never a hardcoded default.
|
|
324
353
|
|
|
325
|
-
|
|
326
|
-
|
|
327
|
-
|
|
328
|
-
|
|
354
|
+
Weights must fit in ~55% of unified memory (leaves room for KV cache,
|
|
355
|
+
activations, OS). Among the production-ready models that fit, return the
|
|
356
|
+
most capable (see ``_RECOMMEND_ORDER``) so the recommendation scales with
|
|
357
|
+
the user's hardware instead of defaulting to any one model.
|
|
329
358
|
"""
|
|
330
359
|
if ram_gb is None:
|
|
331
360
|
ram_gb = _system_ram_gb()
|
|
332
|
-
# Sort candidates by size_gb; pick the biggest whose weights fit
|
|
333
|
-
# in ~55% of RAM (leaves room for KV cache, activations, OS).
|
|
334
361
|
budget = ram_gb * 0.55
|
|
335
|
-
|
|
336
|
-
|
|
337
|
-
|
|
338
|
-
|
|
339
|
-
|
|
340
|
-
|
|
362
|
+
candidates = [
|
|
363
|
+
c for c in CHOICES
|
|
364
|
+
if c.architecture not in _NO_AUTO_RECOMMEND_ARCHS and c.size_gb <= budget
|
|
365
|
+
]
|
|
366
|
+
if candidates:
|
|
367
|
+
# Most capable that fits; tie-break toward the larger (better-quant) file.
|
|
368
|
+
return min(candidates, key=lambda c: (_capability_rank(c), -c.size_gb))
|
|
369
|
+
# Nothing fits the budget — smallest production-ready model so the user still
|
|
370
|
+
# gets something runnable rather than an impossible recommendation.
|
|
371
|
+
prod = [c for c in CHOICES if c.architecture not in _NO_AUTO_RECOMMEND_ARCHS]
|
|
372
|
+
return min(prod or CHOICES, key=lambda c: c.size_gb)
|
|
341
373
|
|
|
342
374
|
|
|
343
375
|
def by_key(key: str) -> ModelChoice | None:
|
|
@@ -404,39 +436,6 @@ def current(config) -> ModelChoice | None:
|
|
|
404
436
|
return by_filename(name)
|
|
405
437
|
|
|
406
438
|
|
|
407
|
-
def format_choice_long(c: ModelChoice, *, downloaded: bool, current_marker: bool = False) -> str:
|
|
408
|
-
"""Multi-line formatted description for the picker UI."""
|
|
409
|
-
marker = " (current)" if current_marker else ""
|
|
410
|
-
status = "downloaded" if downloaded else f"will download {c.size_gb:.1f} GB"
|
|
411
|
-
if c.humaneval_pass_at_1 is not None:
|
|
412
|
-
bench = f"{c.humaneval_pass_at_1*100:.1f}% HumanEval pass@1 (measured on this stack)"
|
|
413
|
-
else:
|
|
414
|
-
bench = "no benchmark (untested on this stack)"
|
|
415
|
-
# Warn if this model is too big for the current Mac's RAM budget.
|
|
416
|
-
# Short inline warning; the picker screen also dims models with a
|
|
417
|
-
# bad fit so users can see at a glance.
|
|
418
|
-
try:
|
|
419
|
-
from .health import estimate_fit
|
|
420
|
-
fits, reason = estimate_fit(c.size_gb)
|
|
421
|
-
except Exception:
|
|
422
|
-
fits, reason = True, ""
|
|
423
|
-
fit_line = "" if fits else f" ⚠ fit: {reason}\n"
|
|
424
|
-
return (
|
|
425
|
-
f"[{c.key}] {c.name}{marker}\n"
|
|
426
|
-
f" source: {c.hf_repo}\n"
|
|
427
|
-
f" url: {c.hf_url}\n"
|
|
428
|
-
f" filename: {c.filename}\n"
|
|
429
|
-
f" size: {c.size_gb:.1f} GB ({status})\n"
|
|
430
|
-
f"{fit_line}"
|
|
431
|
-
f" active: {c.active_params}\n"
|
|
432
|
-
f" arch: {c.architecture}\n"
|
|
433
|
-
f" license: {c.license}\n"
|
|
434
|
-
f" benchmark: {bench}\n"
|
|
435
|
-
f" download path: {c.local_path}\n"
|
|
436
|
-
f" note: {c.notes}"
|
|
437
|
-
)
|
|
438
|
-
|
|
439
|
-
|
|
440
439
|
# ---------------------------------------------------------------------------
|
|
441
440
|
# Curated MODEL-GROUP layer (ADDITIVE — built on top of the catalog above).
|
|
442
441
|
#
|
|
@@ -1,9 +1,6 @@
|
|
|
1
1
|
from __future__ import annotations
|
|
2
2
|
|
|
3
3
|
import re
|
|
4
|
-
import subprocess
|
|
5
|
-
import tempfile
|
|
6
|
-
from pathlib import Path
|
|
7
4
|
from dataclasses import dataclass
|
|
8
5
|
|
|
9
6
|
|
|
@@ -24,13 +21,6 @@ class DiffFile:
|
|
|
24
21
|
hunks: list[DiffHunk]
|
|
25
22
|
|
|
26
23
|
|
|
27
|
-
def extract_last_diff_block(text: str) -> str | None:
|
|
28
|
-
matches = DIFF_BLOCK_RE.findall(text)
|
|
29
|
-
if not matches:
|
|
30
|
-
return None
|
|
31
|
-
return matches[-1].strip()
|
|
32
|
-
|
|
33
|
-
|
|
34
24
|
def parse_diff(diff_text: str) -> list[DiffFile]:
|
|
35
25
|
files: list[DiffFile] = []
|
|
36
26
|
current: DiffFile | None = None
|
|
@@ -73,18 +63,3 @@ def build_diff(selected_files: list[DiffFile]) -> str:
|
|
|
73
63
|
blocks.append(hunk.header)
|
|
74
64
|
blocks.extend(hunk.lines)
|
|
75
65
|
return "\n".join(blocks) + ("\n" if blocks else "")
|
|
76
|
-
|
|
77
|
-
|
|
78
|
-
def apply_diff(repo_root: Path, diff_text: str) -> tuple[bool, str]:
|
|
79
|
-
with tempfile.NamedTemporaryFile("w", suffix=".diff", delete=False) as handle:
|
|
80
|
-
handle.write(diff_text)
|
|
81
|
-
patch_path = Path(handle.name)
|
|
82
|
-
result = subprocess.run(
|
|
83
|
-
["git", "apply", "--reject", "--whitespace=nowarn", str(patch_path)],
|
|
84
|
-
cwd=repo_root,
|
|
85
|
-
capture_output=True,
|
|
86
|
-
text=True,
|
|
87
|
-
check=False,
|
|
88
|
-
)
|
|
89
|
-
output = (result.stdout + "\n" + result.stderr).strip()
|
|
90
|
-
return result.returncode == 0, output or "Patch applied."
|
|
@@ -104,14 +104,6 @@ def read_plan(slug: str) -> str | None:
|
|
|
104
104
|
return None
|
|
105
105
|
|
|
106
106
|
|
|
107
|
-
def write_plan(slug: str, content: str) -> Path:
|
|
108
|
-
"""Persist the plan. Returns the path on disk so callers can surface it."""
|
|
109
|
-
ensure_plans_dir()
|
|
110
|
-
p = plan_path(slug)
|
|
111
|
-
p.write_text(content, encoding="utf-8")
|
|
112
|
-
return p
|
|
113
|
-
|
|
114
|
-
|
|
115
107
|
def new_slug() -> str:
|
|
116
108
|
"""Generate a fresh slug, retrying up to 10 times if a file already
|
|
117
109
|
exists (very unlikely but keeps us honest)."""
|
|
@@ -151,26 +151,6 @@ def process_summary(repo_root: Path | str) -> str:
|
|
|
151
151
|
return "\n".join(lines)
|
|
152
152
|
|
|
153
153
|
|
|
154
|
-
def stop_all_records(repo_root: Path | str) -> str:
|
|
155
|
-
records = load_records(repo_root)
|
|
156
|
-
if not records:
|
|
157
|
-
return "No LocalCode-managed processes recorded."
|
|
158
|
-
stopped = 0
|
|
159
|
-
skipped = 0
|
|
160
|
-
for record in list(records):
|
|
161
|
-
if record.stopped_at:
|
|
162
|
-
skipped += 1
|
|
163
|
-
continue
|
|
164
|
-
if record.pid <= 0 or not _pid_alive(record.pid):
|
|
165
|
-
skipped += 1
|
|
166
|
-
continue
|
|
167
|
-
if stop_record(repo_root, record):
|
|
168
|
-
stopped += 1
|
|
169
|
-
else:
|
|
170
|
-
skipped += 1
|
|
171
|
-
return f"Stopped {stopped} LocalCode-managed process group(s). Skipped {skipped}."
|
|
172
|
-
|
|
173
|
-
|
|
174
154
|
def _pid_alive(pid: int) -> bool:
|
|
175
155
|
try:
|
|
176
156
|
os.kill(pid, 0)
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
"""Per-machine model launch recommendations — the output of the model-opt loop.
|
|
2
2
|
|
|
3
|
-
The offline optimizer (eval/model_opt.py) sweeps quants/params, scores each
|
|
3
|
+
The offline optimizer (dev/eval/model_opt.py) sweeps quants/params, scores each
|
|
4
4
|
combo on the eval suite, and writes the winner here. At launch,
|
|
5
5
|
``runtime.llama_server_command`` consults ``load_overrides`` so the tuned
|
|
6
6
|
params are applied automatically.
|
|
@@ -217,7 +217,7 @@ class StreamEvent(dict):
|
|
|
217
217
|
def apply_param_overrides(cmd: list[str], env: dict | None = None) -> list[str]:
|
|
218
218
|
"""Rewrite llama-server flags from ``LOCALCODE_OVERRIDE_*`` env vars.
|
|
219
219
|
|
|
220
|
-
Lets the offline model-optimizer (eval/model_opt.py) sweep launch
|
|
220
|
+
Lets the offline model-optimizer (dev/eval/model_opt.py) sweep launch
|
|
221
221
|
parameters — GPU layers, context size, threads, batch — WITHOUT editing
|
|
222
222
|
config or the catalog. Only flags already present in ``cmd`` are
|
|
223
223
|
rewritten; an unset env var leaves the command untouched, so the default
|
|
@@ -193,21 +193,3 @@ def create_snapshot(session_id: str, repo_root: str, messages: list[dict],
|
|
|
193
193
|
store = SnapshotStore()
|
|
194
194
|
store.save(snapshot)
|
|
195
195
|
return snapshot
|
|
196
|
-
|
|
197
|
-
|
|
198
|
-
def restore_snapshot(snapshot: GhostSnapshot) -> dict:
|
|
199
|
-
"""Restore file system state from a snapshot.
|
|
200
|
-
|
|
201
|
-
Returns dict of files restored.
|
|
202
|
-
"""
|
|
203
|
-
restored = {}
|
|
204
|
-
root = Path(snapshot.repo_root)
|
|
205
|
-
for rel_path, content in snapshot.file_snapshots.items():
|
|
206
|
-
full = root / rel_path
|
|
207
|
-
try:
|
|
208
|
-
full.parent.mkdir(parents=True, exist_ok=True)
|
|
209
|
-
full.write_text(content)
|
|
210
|
-
restored[rel_path] = "restored"
|
|
211
|
-
except Exception as e:
|
|
212
|
-
restored[rel_path] = f"error: {e}"
|
|
213
|
-
return restored
|