LICENSE
MANIFEST.in
README.md
pyproject.toml
setup.py
llama-cpp-turboquant/CMakeLists.txt
llama-cpp-turboquant/CMakePresets.json
llama-cpp-turboquant/LICENSE
llama-cpp-turboquant/cmake/arm64-apple-clang.cmake
llama-cpp-turboquant/cmake/arm64-windows-llvm.cmake
llama-cpp-turboquant/cmake/build-info.cmake
llama-cpp-turboquant/cmake/common.cmake
llama-cpp-turboquant/cmake/download-models.cmake
llama-cpp-turboquant/cmake/git-vars.cmake
llama-cpp-turboquant/cmake/license.cmake
llama-cpp-turboquant/cmake/llama-config.cmake.in
llama-cpp-turboquant/cmake/llama.pc.in
llama-cpp-turboquant/cmake/riscv64-spacemit-linux-gnu-gcc.cmake
llama-cpp-turboquant/cmake/x64-windows-llvm.cmake
llama-cpp-turboquant/common/CMakeLists.txt
llama-cpp-turboquant/common/arg.cpp
llama-cpp-turboquant/common/arg.h
llama-cpp-turboquant/common/base64.hpp
llama-cpp-turboquant/common/chat-auto-parser-generator.cpp
llama-cpp-turboquant/common/chat-auto-parser-helpers.cpp
llama-cpp-turboquant/common/chat-auto-parser-helpers.h
llama-cpp-turboquant/common/chat-auto-parser.h
llama-cpp-turboquant/common/chat-diff-analyzer.cpp
llama-cpp-turboquant/common/chat-peg-parser.cpp
llama-cpp-turboquant/common/chat-peg-parser.h
llama-cpp-turboquant/common/chat.cpp
llama-cpp-turboquant/common/chat.h
llama-cpp-turboquant/common/common.cpp
llama-cpp-turboquant/common/common.h
llama-cpp-turboquant/common/console.cpp
llama-cpp-turboquant/common/console.h
llama-cpp-turboquant/common/debug.cpp
llama-cpp-turboquant/common/debug.h
llama-cpp-turboquant/common/download.cpp
llama-cpp-turboquant/common/download.h
llama-cpp-turboquant/common/hf-cache.cpp
llama-cpp-turboquant/common/hf-cache.h
llama-cpp-turboquant/common/http.h
llama-cpp-turboquant/common/json-partial.cpp
llama-cpp-turboquant/common/json-partial.h
llama-cpp-turboquant/common/json-schema-to-grammar.cpp
llama-cpp-turboquant/common/json-schema-to-grammar.h
llama-cpp-turboquant/common/llguidance.cpp
llama-cpp-turboquant/common/log.cpp
llama-cpp-turboquant/common/log.h
llama-cpp-turboquant/common/ngram-cache.cpp
llama-cpp-turboquant/common/ngram-cache.h
llama-cpp-turboquant/common/ngram-map.cpp
llama-cpp-turboquant/common/ngram-map.h
llama-cpp-turboquant/common/ngram-mod.cpp
llama-cpp-turboquant/common/ngram-mod.h
llama-cpp-turboquant/common/peg-parser.cpp
llama-cpp-turboquant/common/peg-parser.h
llama-cpp-turboquant/common/preset.cpp
llama-cpp-turboquant/common/preset.h
llama-cpp-turboquant/common/reasoning-budget.cpp
llama-cpp-turboquant/common/reasoning-budget.h
llama-cpp-turboquant/common/regex-partial.cpp
llama-cpp-turboquant/common/regex-partial.h
llama-cpp-turboquant/common/sampling.cpp
llama-cpp-turboquant/common/sampling.h
llama-cpp-turboquant/common/speculative.cpp
llama-cpp-turboquant/common/speculative.h
llama-cpp-turboquant/common/unicode.cpp
llama-cpp-turboquant/common/unicode.h
llama-cpp-turboquant/common/jinja/caps.cpp
llama-cpp-turboquant/common/jinja/caps.h
llama-cpp-turboquant/common/jinja/lexer.cpp
llama-cpp-turboquant/common/jinja/lexer.h
llama-cpp-turboquant/common/jinja/parser.cpp
llama-cpp-turboquant/common/jinja/parser.h
llama-cpp-turboquant/common/jinja/runtime.cpp
llama-cpp-turboquant/common/jinja/runtime.h
llama-cpp-turboquant/common/jinja/string.cpp
llama-cpp-turboquant/common/jinja/string.h
llama-cpp-turboquant/common/jinja/utils.h
llama-cpp-turboquant/common/jinja/value.cpp
llama-cpp-turboquant/common/jinja/value.h
llama-cpp-turboquant/ggml/include/ggml-alloc.h
llama-cpp-turboquant/ggml/include/ggml-backend.h
llama-cpp-turboquant/ggml/include/ggml-blas.h
llama-cpp-turboquant/ggml/include/ggml-cann.h
llama-cpp-turboquant/ggml/include/ggml-cpp.h
llama-cpp-turboquant/ggml/include/ggml-cpu.h
llama-cpp-turboquant/ggml/include/ggml-cuda.h
llama-cpp-turboquant/ggml/include/ggml-hexagon.h
llama-cpp-turboquant/ggml/include/ggml-metal.h
llama-cpp-turboquant/ggml/include/ggml-opencl.h
llama-cpp-turboquant/ggml/include/ggml-openvino.h
llama-cpp-turboquant/ggml/include/ggml-opt.h
llama-cpp-turboquant/ggml/include/ggml-rpc.h
llama-cpp-turboquant/ggml/include/ggml-sycl.h
llama-cpp-turboquant/ggml/include/ggml-virtgpu.h
llama-cpp-turboquant/ggml/include/ggml-vulkan.h
llama-cpp-turboquant/ggml/include/ggml-webgpu.h
llama-cpp-turboquant/ggml/include/ggml-zdnn.h
llama-cpp-turboquant/ggml/include/ggml-zendnn.h
llama-cpp-turboquant/ggml/include/ggml.h
llama-cpp-turboquant/ggml/include/gguf.h
llama-cpp-turboquant/ggml/src/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-alloc.c
llama-cpp-turboquant/ggml/src/ggml-backend-dl.cpp
llama-cpp-turboquant/ggml/src/ggml-backend-dl.h
llama-cpp-turboquant/ggml/src/ggml-backend-impl.h
llama-cpp-turboquant/ggml/src/ggml-backend-reg.cpp
llama-cpp-turboquant/ggml/src/ggml-backend.cpp
llama-cpp-turboquant/ggml/src/ggml-common.h
llama-cpp-turboquant/ggml/src/ggml-impl.h
llama-cpp-turboquant/ggml/src/ggml-opt.cpp
llama-cpp-turboquant/ggml/src/ggml-quants.c
llama-cpp-turboquant/ggml/src/ggml-quants.h
llama-cpp-turboquant/ggml/src/ggml-threading.cpp
llama-cpp-turboquant/ggml/src/ggml-threading.h
llama-cpp-turboquant/ggml/src/ggml-turbo-quant.c
llama-cpp-turboquant/ggml/src/ggml.c
llama-cpp-turboquant/ggml/src/ggml.cpp
llama-cpp-turboquant/ggml/src/gguf.cpp
llama-cpp-turboquant/ggml/src/ggml-blas/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-blas/ggml-blas.cpp
llama-cpp-turboquant/ggml/src/ggml-cann/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-cann/acl_tensor.cpp
llama-cpp-turboquant/ggml/src/ggml-cann/acl_tensor.h
llama-cpp-turboquant/ggml/src/ggml-cann/aclnn_ops.cpp
llama-cpp-turboquant/ggml/src/ggml-cann/aclnn_ops.h
llama-cpp-turboquant/ggml/src/ggml-cann/common.h
llama-cpp-turboquant/ggml/src/ggml-cann/ggml-cann.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-cpu/arch-fallback.h
llama-cpp-turboquant/ggml/src/ggml-cpu/binary-ops.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/binary-ops.h
llama-cpp-turboquant/ggml/src/ggml-cpu/common.h
llama-cpp-turboquant/ggml/src/ggml-cpu/ggml-cpu-impl.h
llama-cpp-turboquant/ggml/src/ggml-cpu/ggml-cpu.c
llama-cpp-turboquant/ggml/src/ggml-cpu/ggml-cpu.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/hbm.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/hbm.h
llama-cpp-turboquant/ggml/src/ggml-cpu/ops.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/ops.h
llama-cpp-turboquant/ggml/src/ggml-cpu/quants.c
llama-cpp-turboquant/ggml/src/ggml-cpu/quants.h
llama-cpp-turboquant/ggml/src/ggml-cpu/repack.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/repack.h
llama-cpp-turboquant/ggml/src/ggml-cpu/simd-gemm.h
llama-cpp-turboquant/ggml/src/ggml-cpu/simd-mappings.h
llama-cpp-turboquant/ggml/src/ggml-cpu/traits.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/traits.h
llama-cpp-turboquant/ggml/src/ggml-cpu/unary-ops.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/unary-ops.h
llama-cpp-turboquant/ggml/src/ggml-cpu/vec.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/vec.h
llama-cpp-turboquant/ggml/src/ggml-cpu/amx/amx.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/amx/amx.h
llama-cpp-turboquant/ggml/src/ggml-cpu/amx/common.h
llama-cpp-turboquant/ggml/src/ggml-cpu/amx/mmq.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/amx/mmq.h
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/arm/cpu-feats.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/arm/quants.c
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/arm/repack.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/loongarch/quants.c
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/powerpc/cpu-feats.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/powerpc/quants.c
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/riscv/cpu-feats.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/riscv/quants.c
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/riscv/repack.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/s390/cpu-feats.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/s390/quants.c
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/wasm/quants.c
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/x86/cpu-feats.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/x86/quants.c
llama-cpp-turboquant/ggml/src/ggml-cpu/arch/x86/repack.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/cmake/FindSIMD.cmake
llama-cpp-turboquant/ggml/src/ggml-cpu/kleidiai/kernels.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/kleidiai/kernels.h
llama-cpp-turboquant/ggml/src/ggml-cpu/kleidiai/kleidiai.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/kleidiai/kleidiai.h
llama-cpp-turboquant/ggml/src/ggml-cpu/llamafile/sgemm.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/llamafile/sgemm.h
llama-cpp-turboquant/ggml/src/ggml-cpu/spacemit/ime.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/spacemit/ime.h
llama-cpp-turboquant/ggml/src/ggml-cpu/spacemit/ime1_kernels.cpp
llama-cpp-turboquant/ggml/src/ggml-cpu/spacemit/ime_kernels.h
llama-cpp-turboquant/ggml/src/ggml-cuda/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-cuda/vendors/cuda.h
llama-cpp-turboquant/ggml/src/ggml-cuda/vendors/hip.h
llama-cpp-turboquant/ggml/src/ggml-cuda/vendors/musa.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-hexagon/ggml-hexagon.cpp
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp-drv.cpp
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp-drv.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/libdl.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/op-desc.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/act-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/argsort-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/binary-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/cmake-toolchain.cmake
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/cpy-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/cumsum-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/flash-attn-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/get-rows-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-dma.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-dma.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-dump.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-fastdiv.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-utils.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hmx-matmul-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hmx-ops.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hmx-profile.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hmx-utils.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/htp-ctx.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/htp-msg.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/htp-ops.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-arith.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-base.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-copy.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-div.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-dump.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-exp.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-floor.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-inverse.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-reduce.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-scale.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-sigmoid.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-sqrt.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-types.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-utils.h
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/main.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/matmul-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/repeat-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/rope-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/set-rows-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/softmax-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/ssm-conv.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/sum-rows-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/unary-ops.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/worker-pool.c
llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/worker-pool.h
llama-cpp-turboquant/ggml/src/ggml-hip/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-metal/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-common.cpp
llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-common.h
llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-context.h
llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-context.m
llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-device.cpp
llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-device.h
llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-device.m
llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-impl.h
llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-ops.cpp
llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-ops.h
llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal.cpp
llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal.metal
llama-cpp-turboquant/ggml/src/ggml-metal/turbo-matrices.h
llama-cpp-turboquant/ggml/src/ggml-metal/turbo-wht.h
llama-cpp-turboquant/ggml/src/ggml-musa/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-opencl/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-opencl/ggml-opencl.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-decoder.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-decoder.h
llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-openvino-extra.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-openvino-extra.h
llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-openvino.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-quants.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-quants.h
llama-cpp-turboquant/ggml/src/ggml-openvino/utils.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/utils.h
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/decoder.h
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/frontend.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/frontend.h
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/input_model.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/input_model.h
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/node_context.h
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op_table.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op_table.h
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/translate_session.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/translate_session.h
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/utils.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/utils.h
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/cont.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/cpy.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/flash_attn_ext.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/get_rows.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/glu_geglu.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/glu_swiglu.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/mulmat.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/permute.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/reshape.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/rms_norm.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/rope.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/scale.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/set_rows.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/softmax.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/transpose.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/unary_silu.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/view.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/eliminate_zp.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/eliminate_zp.h
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/fuse_to_sdpa.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/fuse_to_sdpa.h
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/mark_decompression_convert_constant_folding.h
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/squeeze_matmul.cpp
llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/squeeze_matmul.h
llama-cpp-turboquant/ggml/src/ggml-rpc/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-rpc/ggml-rpc.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-sycl/add-id.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/add-id.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/backend.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/binbcast.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/binbcast.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/common.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/common.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/concat.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/concat.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/conv.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/conv.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/convert.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/convert.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/count-equal.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/count-equal.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/cpy.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/cpy.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/dequantize.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/dmmv.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/dmmv.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/element_wise.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/element_wise.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/fattn-common.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/fattn-tile.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/fattn-tile.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/fattn-vec.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/fattn.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/fattn.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/gated_delta_net.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/gated_delta_net.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/gemm.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/getrows.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/getrows.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/ggml-sycl.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/gla.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/gla.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/im2col.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/im2col.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/mmq.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/mmq.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/mmvq.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/mmvq.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/norm.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/norm.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/outprod.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/outprod.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/pad.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/pad.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/pad_reflect_1d.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/pad_reflect_1d.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/presets.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/quantize.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/quants.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/repeat_back.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/repeat_back.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/roll.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/roll.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/rope.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/rope.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/set.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/set.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/set_rows.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/set_rows.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/softmax.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/softmax.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/ssm_conv.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/ssm_conv.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/sycl_hw.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/sycl_hw.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/tsembd.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/tsembd.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/type.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/upscale.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/upscale.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/vecdotq.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/wkv.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/wkv.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/dpct/helper.hpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq112-dv112.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq128-dv128.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq256-dv256.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq40-dv40.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq576-dv512.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq64-dv64.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq72-dv72.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq80-dv80.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq96-dv96.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-f16.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q4_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q4_1.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q5_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q5_1.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q8_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-f16.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q4_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q4_1.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q5_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q5_1.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q8_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-f16.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q4_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q4_1.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q5_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q5_1.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q8_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-f16.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q4_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q4_1.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q5_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q5_1.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q8_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-f16.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q4_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q4_1.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q5_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q5_1.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q8_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-f16.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q4_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q4_1.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q5_0.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q5_1.cpp
llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q8_0.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-virtgpu/apir_cs_ggml-rpc-front.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend-buffer-type.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend-buffer.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend-device.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend-reg.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-remoting.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-apir.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-backend.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-buffer-type.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-buffer.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-device.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-impl.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward.gen.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-shm.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-shm.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-utils.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-utils.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/apir_cs_ggml-rpc-back.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-convert.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched-backend.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched-buffer-type.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched-buffer.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched-device.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched.gen.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-virgl-apir.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend.cpp
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/api_remoting.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_backend.gen.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_backend.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_cs.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_cs_ggml.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_cs_rpc.h
llama-cpp-turboquant/ggml/src/ggml-virtgpu/include/apir_hw.h
llama-cpp-turboquant/ggml/src/ggml-vulkan/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-vulkan/ggml-vulkan.cpp
llama-cpp-turboquant/ggml/src/ggml-vulkan/vulkan-shaders/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-vulkan/vulkan-shaders/vulkan-shaders-gen.cpp
llama-cpp-turboquant/ggml/src/ggml-webgpu/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-webgpu/ggml-webgpu-shader-lib.hpp
llama-cpp-turboquant/ggml/src/ggml-webgpu/ggml-webgpu.cpp
llama-cpp-turboquant/ggml/src/ggml-webgpu/pre_wgsl.hpp
llama-cpp-turboquant/ggml/src/ggml-zdnn/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-zdnn/common.hpp
llama-cpp-turboquant/ggml/src/ggml-zdnn/ggml-zdnn.cpp
llama-cpp-turboquant/ggml/src/ggml-zdnn/mmf.cpp
llama-cpp-turboquant/ggml/src/ggml-zdnn/mmf.hpp
llama-cpp-turboquant/ggml/src/ggml-zdnn/utils.cpp
llama-cpp-turboquant/ggml/src/ggml-zdnn/utils.hpp
llama-cpp-turboquant/ggml/src/ggml-zendnn/CMakeLists.txt
llama-cpp-turboquant/ggml/src/ggml-zendnn/ggml-zendnn.cpp
llama-cpp-turboquant/include/llama-cpp.h
llama-cpp-turboquant/include/llama.h
llama-cpp-turboquant/licenses/LICENSE-jsonhpp
llama-cpp-turboquant/src/CMakeLists.txt
llama-cpp-turboquant/src/llama-adapter.cpp
llama-cpp-turboquant/src/llama-adapter.h
llama-cpp-turboquant/src/llama-arch.cpp
llama-cpp-turboquant/src/llama-arch.h
llama-cpp-turboquant/src/llama-batch.cpp
llama-cpp-turboquant/src/llama-batch.h
llama-cpp-turboquant/src/llama-chat.cpp
llama-cpp-turboquant/src/llama-chat.h
llama-cpp-turboquant/src/llama-context.cpp
llama-cpp-turboquant/src/llama-context.h
llama-cpp-turboquant/src/llama-cparams.cpp
llama-cpp-turboquant/src/llama-cparams.h
llama-cpp-turboquant/src/llama-ext.h
llama-cpp-turboquant/src/llama-grammar.cpp
llama-cpp-turboquant/src/llama-grammar.h
llama-cpp-turboquant/src/llama-graph.cpp
llama-cpp-turboquant/src/llama-graph.h
llama-cpp-turboquant/src/llama-hparams.cpp
llama-cpp-turboquant/src/llama-hparams.h
llama-cpp-turboquant/src/llama-impl.cpp
llama-cpp-turboquant/src/llama-impl.h
llama-cpp-turboquant/src/llama-io.cpp
llama-cpp-turboquant/src/llama-io.h
llama-cpp-turboquant/src/llama-kv-cache-iswa.cpp
llama-cpp-turboquant/src/llama-kv-cache-iswa.h
llama-cpp-turboquant/src/llama-kv-cache.cpp
llama-cpp-turboquant/src/llama-kv-cache.h
llama-cpp-turboquant/src/llama-kv-cells.h
llama-cpp-turboquant/src/llama-memory-hybrid-iswa.cpp
llama-cpp-turboquant/src/llama-memory-hybrid-iswa.h
llama-cpp-turboquant/src/llama-memory-hybrid.cpp
llama-cpp-turboquant/src/llama-memory-hybrid.h
llama-cpp-turboquant/src/llama-memory-recurrent.cpp
llama-cpp-turboquant/src/llama-memory-recurrent.h
llama-cpp-turboquant/src/llama-memory.cpp
llama-cpp-turboquant/src/llama-memory.h
llama-cpp-turboquant/src/llama-mmap.cpp
llama-cpp-turboquant/src/llama-mmap.h
llama-cpp-turboquant/src/llama-model-loader.cpp
llama-cpp-turboquant/src/llama-model-loader.h
llama-cpp-turboquant/src/llama-model-saver.cpp
llama-cpp-turboquant/src/llama-model-saver.h
llama-cpp-turboquant/src/llama-model.cpp
llama-cpp-turboquant/src/llama-model.h
llama-cpp-turboquant/src/llama-quant.cpp
llama-cpp-turboquant/src/llama-quant.h
llama-cpp-turboquant/src/llama-sampler.cpp
llama-cpp-turboquant/src/llama-sampler.h
llama-cpp-turboquant/src/llama-vocab.cpp
llama-cpp-turboquant/src/llama-vocab.h
llama-cpp-turboquant/src/llama.cpp
llama-cpp-turboquant/src/turbo-rotation-data-32.h
llama-cpp-turboquant/src/turbo-rotation-data.h
llama-cpp-turboquant/src/unicode-data.cpp
llama-cpp-turboquant/src/unicode-data.h
llama-cpp-turboquant/src/unicode.cpp
llama-cpp-turboquant/src/unicode.h
llama-cpp-turboquant/src/models/afmoe.cpp
llama-cpp-turboquant/src/models/apertus.cpp
llama-cpp-turboquant/src/models/arcee.cpp
llama-cpp-turboquant/src/models/arctic.cpp
llama-cpp-turboquant/src/models/arwkv7.cpp
llama-cpp-turboquant/src/models/baichuan.cpp
llama-cpp-turboquant/src/models/bailingmoe.cpp
llama-cpp-turboquant/src/models/bailingmoe2.cpp
llama-cpp-turboquant/src/models/bert.cpp
llama-cpp-turboquant/src/models/bitnet.cpp
llama-cpp-turboquant/src/models/bloom.cpp
llama-cpp-turboquant/src/models/chameleon.cpp
llama-cpp-turboquant/src/models/chatglm.cpp
llama-cpp-turboquant/src/models/codeshell.cpp
llama-cpp-turboquant/src/models/cogvlm.cpp
llama-cpp-turboquant/src/models/cohere2-iswa.cpp
llama-cpp-turboquant/src/models/command-r.cpp
llama-cpp-turboquant/src/models/dbrx.cpp
llama-cpp-turboquant/src/models/deci.cpp
llama-cpp-turboquant/src/models/deepseek.cpp
llama-cpp-turboquant/src/models/deepseek2.cpp
llama-cpp-turboquant/src/models/delta-net-base.cpp
llama-cpp-turboquant/src/models/dots1.cpp
llama-cpp-turboquant/src/models/dream.cpp
llama-cpp-turboquant/src/models/ernie4-5-moe.cpp
llama-cpp-turboquant/src/models/ernie4-5.cpp
llama-cpp-turboquant/src/models/eurobert.cpp
llama-cpp-turboquant/src/models/exaone-moe.cpp
llama-cpp-turboquant/src/models/exaone.cpp
llama-cpp-turboquant/src/models/exaone4.cpp
llama-cpp-turboquant/src/models/falcon-h1.cpp
llama-cpp-turboquant/src/models/falcon.cpp
llama-cpp-turboquant/src/models/gemma-embedding.cpp
llama-cpp-turboquant/src/models/gemma.cpp
llama-cpp-turboquant/src/models/gemma2-iswa.cpp
llama-cpp-turboquant/src/models/gemma3.cpp
llama-cpp-turboquant/src/models/gemma3n-iswa.cpp
llama-cpp-turboquant/src/models/gemma4-iswa.cpp
llama-cpp-turboquant/src/models/glm4-moe.cpp
llama-cpp-turboquant/src/models/glm4.cpp
llama-cpp-turboquant/src/models/gpt2.cpp
llama-cpp-turboquant/src/models/gptneox.cpp
llama-cpp-turboquant/src/models/granite-hybrid.cpp
llama-cpp-turboquant/src/models/granite.cpp
llama-cpp-turboquant/src/models/grok.cpp
llama-cpp-turboquant/src/models/grovemoe.cpp
llama-cpp-turboquant/src/models/hunyuan-dense.cpp
llama-cpp-turboquant/src/models/hunyuan-moe.cpp
llama-cpp-turboquant/src/models/internlm2.cpp
llama-cpp-turboquant/src/models/jais.cpp
llama-cpp-turboquant/src/models/jais2.cpp
llama-cpp-turboquant/src/models/jamba.cpp
llama-cpp-turboquant/src/models/kimi-linear.cpp
llama-cpp-turboquant/src/models/lfm2.cpp
llama-cpp-turboquant/src/models/llada-moe.cpp
llama-cpp-turboquant/src/models/llada.cpp
llama-cpp-turboquant/src/models/llama-iswa.cpp
llama-cpp-turboquant/src/models/llama.cpp
llama-cpp-turboquant/src/models/maincoder.cpp
llama-cpp-turboquant/src/models/mamba-base.cpp
llama-cpp-turboquant/src/models/mamba.cpp
llama-cpp-turboquant/src/models/mimo2-iswa.cpp
llama-cpp-turboquant/src/models/minicpm3.cpp
llama-cpp-turboquant/src/models/minimax-m2.cpp
llama-cpp-turboquant/src/models/mistral3.cpp
llama-cpp-turboquant/src/models/models.h
llama-cpp-turboquant/src/models/modern-bert.cpp
llama-cpp-turboquant/src/models/mpt.cpp
llama-cpp-turboquant/src/models/nemotron-h.cpp
llama-cpp-turboquant/src/models/nemotron.cpp
llama-cpp-turboquant/src/models/neo-bert.cpp
llama-cpp-turboquant/src/models/olmo.cpp
llama-cpp-turboquant/src/models/olmo2.cpp
llama-cpp-turboquant/src/models/olmoe.cpp
llama-cpp-turboquant/src/models/openai-moe-iswa.cpp
llama-cpp-turboquant/src/models/openelm.cpp
llama-cpp-turboquant/src/models/orion.cpp
llama-cpp-turboquant/src/models/paddleocr.cpp
llama-cpp-turboquant/src/models/pangu-embedded.cpp
llama-cpp-turboquant/src/models/phi2.cpp
llama-cpp-turboquant/src/models/phi3.cpp
llama-cpp-turboquant/src/models/plamo.cpp
llama-cpp-turboquant/src/models/plamo2.cpp
llama-cpp-turboquant/src/models/plamo3.cpp
llama-cpp-turboquant/src/models/plm.cpp
llama-cpp-turboquant/src/models/qwen.cpp
llama-cpp-turboquant/src/models/qwen2.cpp
llama-cpp-turboquant/src/models/qwen2moe.cpp
llama-cpp-turboquant/src/models/qwen2vl.cpp
llama-cpp-turboquant/src/models/qwen3.cpp
llama-cpp-turboquant/src/models/qwen35.cpp
llama-cpp-turboquant/src/models/qwen35moe.cpp
llama-cpp-turboquant/src/models/qwen3moe.cpp
llama-cpp-turboquant/src/models/qwen3next.cpp
llama-cpp-turboquant/src/models/qwen3vl-moe.cpp
llama-cpp-turboquant/src/models/qwen3vl.cpp
llama-cpp-turboquant/src/models/refact.cpp
llama-cpp-turboquant/src/models/rnd1.cpp
llama-cpp-turboquant/src/models/rwkv6-base.cpp
llama-cpp-turboquant/src/models/rwkv6.cpp
llama-cpp-turboquant/src/models/rwkv6qwen2.cpp
llama-cpp-turboquant/src/models/rwkv7-base.cpp
llama-cpp-turboquant/src/models/rwkv7.cpp
llama-cpp-turboquant/src/models/seed-oss.cpp
llama-cpp-turboquant/src/models/smallthinker.cpp
llama-cpp-turboquant/src/models/smollm3.cpp
llama-cpp-turboquant/src/models/stablelm.cpp
llama-cpp-turboquant/src/models/starcoder.cpp
llama-cpp-turboquant/src/models/starcoder2.cpp
llama-cpp-turboquant/src/models/step35-iswa.cpp
llama-cpp-turboquant/src/models/t5-dec.cpp
llama-cpp-turboquant/src/models/t5-enc.cpp
llama-cpp-turboquant/src/models/wavtokenizer-dec.cpp
llama-cpp-turboquant/src/models/xverse.cpp
llama-cpp-turboquant/tools/CMakeLists.txt
llama-cpp-turboquant/tools/batched-bench/CMakeLists.txt
llama-cpp-turboquant/tools/batched-bench/batched-bench.cpp
llama-cpp-turboquant/tools/cli/CMakeLists.txt
llama-cpp-turboquant/tools/cli/cli.cpp
llama-cpp-turboquant/tools/completion/CMakeLists.txt
llama-cpp-turboquant/tools/completion/completion.cpp
llama-cpp-turboquant/tools/cvector-generator/CMakeLists.txt
llama-cpp-turboquant/tools/cvector-generator/cvector-generator.cpp
llama-cpp-turboquant/tools/cvector-generator/mean.hpp
llama-cpp-turboquant/tools/cvector-generator/pca.hpp
llama-cpp-turboquant/tools/export-lora/CMakeLists.txt
llama-cpp-turboquant/tools/export-lora/export-lora.cpp
llama-cpp-turboquant/tools/fit-params/CMakeLists.txt
llama-cpp-turboquant/tools/fit-params/fit-params.cpp
llama-cpp-turboquant/tools/gguf-split/CMakeLists.txt
llama-cpp-turboquant/tools/gguf-split/gguf-split.cpp
llama-cpp-turboquant/tools/imatrix/CMakeLists.txt
llama-cpp-turboquant/tools/imatrix/imatrix.cpp
llama-cpp-turboquant/tools/llama-bench/CMakeLists.txt
llama-cpp-turboquant/tools/llama-bench/llama-bench.cpp
llama-cpp-turboquant/tools/mtmd/CMakeLists.txt
llama-cpp-turboquant/tools/mtmd/clip-graph.h
llama-cpp-turboquant/tools/mtmd/clip-impl.h
llama-cpp-turboquant/tools/mtmd/clip-model.h
llama-cpp-turboquant/tools/mtmd/clip.cpp
llama-cpp-turboquant/tools/mtmd/clip.h
llama-cpp-turboquant/tools/mtmd/deprecation-warning.cpp
llama-cpp-turboquant/tools/mtmd/mtmd-audio.cpp
llama-cpp-turboquant/tools/mtmd/mtmd-audio.h
llama-cpp-turboquant/tools/mtmd/mtmd-cli.cpp
llama-cpp-turboquant/tools/mtmd/mtmd-helper.cpp
llama-cpp-turboquant/tools/mtmd/mtmd-helper.h
llama-cpp-turboquant/tools/mtmd/mtmd-image.cpp
llama-cpp-turboquant/tools/mtmd/mtmd-image.h
llama-cpp-turboquant/tools/mtmd/mtmd.cpp
llama-cpp-turboquant/tools/mtmd/mtmd.h
llama-cpp-turboquant/tools/mtmd/debug/mtmd-debug.cpp
llama-cpp-turboquant/tools/mtmd/debug/mtmd-debug.h
llama-cpp-turboquant/tools/mtmd/models/cogvlm.cpp
llama-cpp-turboquant/tools/mtmd/models/conformer.cpp
llama-cpp-turboquant/tools/mtmd/models/deepseekocr.cpp
llama-cpp-turboquant/tools/mtmd/models/gemma4v.cpp
llama-cpp-turboquant/tools/mtmd/models/glm4v.cpp
llama-cpp-turboquant/tools/mtmd/models/hunyuanocr.cpp
llama-cpp-turboquant/tools/mtmd/models/internvl.cpp
llama-cpp-turboquant/tools/mtmd/models/kimik25.cpp
llama-cpp-turboquant/tools/mtmd/models/kimivl.cpp
llama-cpp-turboquant/tools/mtmd/models/llama4.cpp
llama-cpp-turboquant/tools/mtmd/models/llava.cpp
llama-cpp-turboquant/tools/mtmd/models/minicpmv.cpp
llama-cpp-turboquant/tools/mtmd/models/mobilenetv5.cpp
llama-cpp-turboquant/tools/mtmd/models/models.h
llama-cpp-turboquant/tools/mtmd/models/nemotron-v2-vl.cpp
llama-cpp-turboquant/tools/mtmd/models/paddleocr.cpp
llama-cpp-turboquant/tools/mtmd/models/pixtral.cpp
llama-cpp-turboquant/tools/mtmd/models/qwen2vl.cpp
llama-cpp-turboquant/tools/mtmd/models/qwen3vl.cpp
llama-cpp-turboquant/tools/mtmd/models/siglip.cpp
llama-cpp-turboquant/tools/mtmd/models/whisper-enc.cpp
llama-cpp-turboquant/tools/mtmd/models/youtuvl.cpp
llama-cpp-turboquant/tools/parser/CMakeLists.txt
llama-cpp-turboquant/tools/parser/debug-template-parser.cpp
llama-cpp-turboquant/tools/parser/template-analysis.cpp
llama-cpp-turboquant/tools/perplexity/CMakeLists.txt
llama-cpp-turboquant/tools/perplexity/perplexity.cpp
llama-cpp-turboquant/tools/quantize/CMakeLists.txt
llama-cpp-turboquant/tools/quantize/quantize.cpp
llama-cpp-turboquant/tools/results/CMakeLists.txt
llama-cpp-turboquant/tools/results/results.cpp
llama-cpp-turboquant/tools/rpc/CMakeLists.txt
llama-cpp-turboquant/tools/rpc/rpc-server.cpp
llama-cpp-turboquant/tools/server/CMakeLists.txt
llama-cpp-turboquant/tools/server/server-common.cpp
llama-cpp-turboquant/tools/server/server-common.h
llama-cpp-turboquant/tools/server/server-context.cpp
llama-cpp-turboquant/tools/server/server-context.h
llama-cpp-turboquant/tools/server/server-cors-proxy.h
llama-cpp-turboquant/tools/server/server-http.cpp
llama-cpp-turboquant/tools/server/server-http.h
llama-cpp-turboquant/tools/server/server-models.cpp
llama-cpp-turboquant/tools/server/server-models.h
llama-cpp-turboquant/tools/server/server-queue.cpp
llama-cpp-turboquant/tools/server/server-queue.h
llama-cpp-turboquant/tools/server/server-task.cpp
llama-cpp-turboquant/tools/server/server-task.h
llama-cpp-turboquant/tools/server/server-tools.cpp
llama-cpp-turboquant/tools/server/server-tools.h
llama-cpp-turboquant/tools/server/server.cpp
llama-cpp-turboquant/tools/tokenize/CMakeLists.txt
llama-cpp-turboquant/tools/tokenize/tokenize.cpp
llama-cpp-turboquant/tools/tts/CMakeLists.txt
llama-cpp-turboquant/tools/tts/tts.cpp
llama-cpp-turboquant/vendor/cpp-httplib/CMakeLists.txt
llama-cpp-turboquant/vendor/cpp-httplib/httplib.cpp
llama-cpp-turboquant/vendor/cpp-httplib/httplib.h
llama-cpp-turboquant/vendor/miniaudio/miniaudio.h
llama-cpp-turboquant/vendor/nlohmann/json.hpp
llama-cpp-turboquant/vendor/nlohmann/json_fwd.hpp
llama-cpp-turboquant/vendor/sheredom/subprocess.h
llama-cpp-turboquant/vendor/stb/stb_image.h
src/localcode/__init__.py
src/localcode/__main__.py
src/localcode/_subproc_env.py
src/localcode/app.py
src/localcode/approvals.py
src/localcode/auto_compact.py
src/localcode/autonomy.py
src/localcode/bootstrap.py
src/localcode/cache.py
src/localcode/compact.py
src/localcode/compaction.py
src/localcode/composer.py
src/localcode/config.py
src/localcode/context.py
src/localcode/display.py
src/localcode/embeddings.py
src/localcode/entrypoint.py
src/localcode/errors.py
src/localcode/events.py
src/localcode/features.py
src/localcode/formatting.py
src/localcode/health.py
src/localcode/history.py
src/localcode/hooks.py
src/localcode/indexer.py
src/localcode/injection_defense.py
src/localcode/launcher.py
src/localcode/logging_utils.py
src/localcode/lsp.py
src/localcode/mcp.py
src/localcode/memory_guard.py
src/localcode/model_families.py
src/localcode/models.py
src/localcode/models_catalog.py
src/localcode/notebook.py
src/localcode/output.py
src/localcode/patching.py
src/localcode/paths.py
src/localcode/performance.py
src/localcode/permissions.py
src/localcode/permissions_v2.py
src/localcode/plans.py
src/localcode/process_registry.py
src/localcode/recovery.py
src/localcode/runtime.py
src/localcode/server_manager.py
src/localcode/session.py
src/localcode/shell.py
src/localcode/skills.py
src/localcode/snapshots.py
src/localcode/sounds.py
src/localcode/telemetry.py
src/localcode/theme.py
src/localcode/thinking.py
src/localcode/tool_parsing.py
src/localcode/tool_router.py
src/localcode/toolkit.py
src/localcode/turn_diff.py
src/localcode/undo.py
src/localcode/verification.py
src/localcode/voice.py
src/localcode.egg-info/PKG-INFO
src/localcode.egg-info/SOURCES.txt
src/localcode.egg-info/dependency_links.txt
src/localcode.egg-info/entry_points.txt
src/localcode.egg-info/requires.txt
src/localcode.egg-info/top_level.txt
src/localcode/agent/__init__.py
src/localcode/agent/app_tasks.py
src/localcode/agent/constants.py
src/localcode/agent/context.py
src/localcode/agent/goal.py
src/localcode/agent/helpers.py
src/localcode/agent/hooks.py
src/localcode/agent/loop.py
src/localcode/agent/prompt_context.py
src/localcode/agent/prompts.py
src/localcode/agent/recovery.py
src/localcode/agent/sections.py
src/localcode/agent/streaming.py
src/localcode/agent/tool_execution.py
src/localcode/agent/tool_orchestration.py
src/localcode/agent/turn_finalization.py
src/localcode/bin/__init__.py
src/localcode/bin/llama-server
src/localcode/skills/debug.md
src/localcode/skills/edit-verified.md
src/localcode/skills/explain.md
src/localcode/skills/git-commit-safely.md
src/localcode/skills/locate.md
src/localcode/skills/plan-task.md
src/localcode/skills/review.md
src/localcode/skills/run-tests.md
src/localcode/tools/__init__.py
src/localcode/tools/agent.py
src/localcode/tools/append_file.py
src/localcode/tools/base.py
src/localcode/tools/bash.py
src/localcode/tools/edit_diff.py
src/localcode/tools/edit_file.py
src/localcode/tools/facts.py
src/localcode/tools/glob_tool.py
src/localcode/tools/grep.py
src/localcode/tools/launch_app.py
src/localcode/tools/list_files.py
src/localcode/tools/multi_edit.py
src/localcode/tools/plan_mode.py
src/localcode/tools/read_file.py
src/localcode/tools/skill_tool.py
src/localcode/tools/web_fetch.py
src/localcode/tools/web_search.py
src/localcode/tools/write_file.py
src/localcode/tui/__init__.py
src/localcode/tui/app.py
src/localcode/tui/bridge.py
src/localcode/tui/screens/__init__.py
src/localcode/tui/screens/chat.py
src/localcode/tui/screens/mode_picker.py
src/localcode/tui/screens/model_picker.py
src/localcode/tui/screens/setup.py
src/localcode/tui/styles/__init__.py
src/localcode/tui/styles/app.tcss
src/localcode/tui/widgets/__init__.py
src/localcode/tui/widgets/approval.py
src/localcode/tui/widgets/chat_log.py
src/localcode/tui/widgets/voice_visualizer.py
src/localcode/tui/widgets/messages/__init__.py
src/localcode/tui/widgets/messages/diff.py
tests/test_agent_event_regressions.py
tests/test_architecture.py
tests/test_bootstrap.py
tests/test_comprehensive_agent.py
tests/test_comprehensive_cli.py
tests/test_comprehensive_download.py
tests/test_comprehensive_install.py
tests/test_comprehensive_machines.py
tests/test_comprehensive_tui.py
tests/test_comprehensive_vision.py
tests/test_comprehensive_voice.py
tests/test_comprehensive_whisper.py
tests/test_config.py
tests/test_context.py
tests/test_context_pipeline_e2e.py
tests/test_download.py
tests/test_fresh_install.py
tests/test_humaneval.py
tests/test_output.py
tests/test_runtime.py
tests/test_subproc_env.py
tests/test_toolkit.py
tests/test_tui_input.py