LICENSE
README.md
pyproject.toml
VeloxQuant_MLX.egg-info/PKG-INFO
VeloxQuant_MLX.egg-info/SOURCES.txt
VeloxQuant_MLX.egg-info/dependency_links.txt
VeloxQuant_MLX.egg-info/entry_points.txt
VeloxQuant_MLX.egg-info/requires.txt
VeloxQuant_MLX.egg-info/top_level.txt
mlx_kv_quant/__init__.py
mlx_kv_quant/__main__.py
mlx_kv_quant/artifacts/__init__.py
mlx_kv_quant/artifacts/base.py
mlx_kv_quant/artifacts/memory_store.py
mlx_kv_quant/artifacts/npy_store.py
mlx_kv_quant/benchmarks/__init__.py
mlx_kv_quant/benchmarks/attend_benchmark.py
mlx_kv_quant/cache/__init__.py
mlx_kv_quant/cache/base.py
mlx_kv_quant/cache/polar_cache.py
mlx_kv_quant/cache/qjl_cache.py
mlx_kv_quant/cache/sliding_window_cache.py
mlx_kv_quant/cache/turboquant_cache.py
mlx_kv_quant/cli/__init__.py
mlx_kv_quant/cli/benchmark.py
mlx_kv_quant/cli/precompute.py
mlx_kv_quant/codebooks/__init__.py
mlx_kv_quant/codebooks/adaptive_codebook.py
mlx_kv_quant/codebooks/base.py
mlx_kv_quant/codebooks/precompute.py
mlx_kv_quant/codebooks/scalar_codebook.py
mlx_kv_quant/codebooks/strategies.py
mlx_kv_quant/core/__init__.py
mlx_kv_quant/core/abstractions.py
mlx_kv_quant/core/constants.py
mlx_kv_quant/core/context.py
mlx_kv_quant/core/exceptions.py
mlx_kv_quant/core/registry.py
mlx_kv_quant/dsa/__init__.py
mlx_kv_quant/dsa/avl_tree.py
mlx_kv_quant/dsa/bit_pack.py
mlx_kv_quant/dsa/dag.py
mlx_kv_quant/dsa/heap.py
mlx_kv_quant/dsa/ring_buffer.py
mlx_kv_quant/handlers/__init__.py
mlx_kv_quant/handlers/base.py
mlx_kv_quant/handlers/bit_pack_handler.py
mlx_kv_quant/handlers/normalization.py
mlx_kv_quant/handlers/outlier_split.py
mlx_kv_quant/handlers/polar_handler.py
mlx_kv_quant/handlers/qjl_residual_handler.py
mlx_kv_quant/handlers/rotation_handler.py
mlx_kv_quant/handlers/scalar_quant_handler.py
mlx_kv_quant/handlers/value_quant_handler.py
mlx_kv_quant/integration/__init__.py
mlx_kv_quant/integration/mlx_lm_patch.py
mlx_kv_quant/math/__init__.py
mlx_kv_quant/math/distributions.py
mlx_kv_quant/math/lloyd_max.py
mlx_kv_quant/math/rotation.py
mlx_kv_quant/observers/__init__.py
mlx_kv_quant/observers/base.py
mlx_kv_quant/observers/distortion.py
mlx_kv_quant/observers/latency.py
mlx_kv_quant/observers/memory.py
mlx_kv_quant/outlier/__init__.py
mlx_kv_quant/outlier/detector.py
mlx_kv_quant/preconditioners/__init__.py
mlx_kv_quant/preconditioners/base.py
mlx_kv_quant/preconditioners/jl_sketch.py
mlx_kv_quant/preconditioners/rotation.py
mlx_kv_quant/quantizers/__init__.py
mlx_kv_quant/quantizers/base.py
mlx_kv_quant/quantizers/composite.py
mlx_kv_quant/quantizers/polarquant.py
mlx_kv_quant/quantizers/qjl.py
mlx_kv_quant/quantizers/turboquant_mse.py
mlx_kv_quant/quantizers/turboquant_prod.py
mlx_kv_quant/quantizers/turboquant_rvq.py
mlx_kv_quant/tests/__init__.py
mlx_kv_quant/tests/conftest.py
mlx_kv_quant/tests/cache/__init__.py
mlx_kv_quant/tests/cache/test_sliding_window.py
mlx_kv_quant/tests/cache/test_turboquant_cache.py
mlx_kv_quant/tests/dsa/__init__.py
mlx_kv_quant/tests/dsa/test_avl_tree.py
mlx_kv_quant/tests/dsa/test_bit_pack.py
mlx_kv_quant/tests/dsa/test_dag.py
mlx_kv_quant/tests/dsa/test_heap.py
mlx_kv_quant/tests/dsa/test_ring_buffer.py
mlx_kv_quant/tests/handlers/__init__.py
mlx_kv_quant/tests/handlers/test_pipeline.py
mlx_kv_quant/tests/integration/__init__.py
mlx_kv_quant/tests/integration/test_distortion_bounds.py
mlx_kv_quant/tests/math/__init__.py
mlx_kv_quant/tests/math/test_distributions.py
mlx_kv_quant/tests/math/test_lloyd_max.py
mlx_kv_quant/tests/quantizers/__init__.py
mlx_kv_quant/tests/quantizers/test_polar.py
mlx_kv_quant/tests/quantizers/test_qjl.py
mlx_kv_quant/tests/quantizers/test_turboquant_mse.py
mlx_kv_quant/tests/quantizers/test_turboquant_prod.py
mlx_kv_quant/transforms/__init__.py
mlx_kv_quant/transforms/base.py
mlx_kv_quant/transforms/polar.py
mlx_kv_quant/weight/__init__.py
mlx_kv_quant/weight/model_quantizer.py
mlx_kv_quant/weight/quantized_linear.py