.coderabbit.yaml
.gitignore
LICENSE
Makefile
README.md
pyproject.toml
pytest-xpu.ini
setup.cfg
setup.py
.claude/skills/style.md
.claude/skills/test.md
.github/.gitkeep
.github/mergify.yml
.github/actions/test/action.yml
.github/scripts/step-status
.github/workflows/quality-check.yaml
.github/workflows/stale.yml
.github/workflows/test-check.yaml
examples/bit_packing/ex_quantize_and_pack.py
examples/bit_packing/int4_config.json
examples/convert_checkpoint/deepseek32_fpblock_example.py
examples/convert_checkpoint/qwen3_fpblock_example.py
examples/convert_checkpoint/qwen3_nvfp4_example.py
examples/llama_1.1b/ex_config_quantization.py
examples/llama_1.1b/ex_llmcompressor_quantization.py
examples/llama_1.1b/example_quant_config.json
examples/llama_1.1b/example_quant_recipe.yaml
src/__init__.py
src/compressed_tensors/__init__.py
src/compressed_tensors/base.py
src/compressed_tensors/logger.py
src/compressed_tensors/version.py
src/compressed_tensors.egg-info/PKG-INFO
src/compressed_tensors.egg-info/SOURCES.txt
src/compressed_tensors.egg-info/dependency_links.txt
src/compressed_tensors.egg-info/requires.txt
src/compressed_tensors.egg-info/top_level.txt
src/compressed_tensors/compressors/__init__.py
src/compressed_tensors/compressors/base.py
src/compressed_tensors/compressors/format.py
src/compressed_tensors/compressors/mx_utils.py
src/compressed_tensors/compressors/dense/__init__.py
src/compressed_tensors/compressors/dense/base.py
src/compressed_tensors/compressors/model_compressors/__init__.py
src/compressed_tensors/compressors/model_compressors/model_compressor.py
src/compressed_tensors/compressors/mxfp4/__init__.py
src/compressed_tensors/compressors/mxfp4/base.py
src/compressed_tensors/compressors/mxfp8/__init__.py
src/compressed_tensors/compressors/mxfp8/base.py
src/compressed_tensors/compressors/naive_quantized/__init__.py
src/compressed_tensors/compressors/naive_quantized/base.py
src/compressed_tensors/compressors/nvfp4/__init__.py
src/compressed_tensors/compressors/nvfp4/base.py
src/compressed_tensors/compressors/nvfp4/helpers.py
src/compressed_tensors/compressors/pack_quantized/__init__.py
src/compressed_tensors/compressors/pack_quantized/base.py
src/compressed_tensors/compressors/pack_quantized/helpers.py
src/compressed_tensors/config/__init__.py
src/compressed_tensors/config/base.py
src/compressed_tensors/config/dense.py
src/compressed_tensors/config/sparse_24_bitmask.py
src/compressed_tensors/config/sparse_bitmask.py
src/compressed_tensors/distributed/README.md
src/compressed_tensors/distributed/__init__.py
src/compressed_tensors/distributed/assign.py
src/compressed_tensors/distributed/module_parallel.py
src/compressed_tensors/distributed/utils.py
src/compressed_tensors/entrypoints/__init__.py
src/compressed_tensors/entrypoints/convert/README.md
src/compressed_tensors/entrypoints/convert/__init__.py
src/compressed_tensors/entrypoints/convert/convert_checkpoint.py
src/compressed_tensors/entrypoints/convert/convert_file.py
src/compressed_tensors/entrypoints/convert/converters/__init__.py
src/compressed_tensors/entrypoints/convert/converters/base.py
src/compressed_tensors/entrypoints/convert/converters/fp8block_dequantizer.py
src/compressed_tensors/entrypoints/convert/converters/modelopt_nvfp4.py
src/compressed_tensors/linear/__init__.py
src/compressed_tensors/linear/compressed_linear.py
src/compressed_tensors/modeling/__init__.py
src/compressed_tensors/modeling/attention.py
src/compressed_tensors/modeling/kvcache.py
src/compressed_tensors/offload/README.md
src/compressed_tensors/offload/__init__.py
src/compressed_tensors/offload/dispatch.py
src/compressed_tensors/offload/dist_utils.py
src/compressed_tensors/offload/load.py
src/compressed_tensors/offload/module.py
src/compressed_tensors/offload/utils.py
src/compressed_tensors/offload/cache/__init__.py
src/compressed_tensors/offload/cache/base.py
src/compressed_tensors/offload/cache/cpu.py
src/compressed_tensors/offload/cache/device.py
src/compressed_tensors/offload/cache/disk.py
src/compressed_tensors/offload/cache/dist_cpu.py
src/compressed_tensors/offload/cache/dist_device.py
src/compressed_tensors/offload/cache/dist_disk.py
src/compressed_tensors/offload/cache/utils.py
src/compressed_tensors/offload/convert/__init__.py
src/compressed_tensors/offload/convert/from_accelerate.py
src/compressed_tensors/offload/convert/helpers.py
src/compressed_tensors/offload/convert/to_accelerate.py
src/compressed_tensors/quantization/__init__.py
src/compressed_tensors/quantization/quant_args.py
src/compressed_tensors/quantization/quant_config.py
src/compressed_tensors/quantization/quant_metadata.py
src/compressed_tensors/quantization/quant_scheme.py
src/compressed_tensors/quantization/lifecycle/__init__.py
src/compressed_tensors/quantization/lifecycle/apply.py
src/compressed_tensors/quantization/lifecycle/compressed.py
src/compressed_tensors/quantization/lifecycle/forward.py
src/compressed_tensors/quantization/lifecycle/forward_helpers.py
src/compressed_tensors/quantization/lifecycle/helpers.py
src/compressed_tensors/quantization/lifecycle/initialize.py
src/compressed_tensors/quantization/utils/__init__.py
src/compressed_tensors/quantization/utils/helpers.py
src/compressed_tensors/quantization/utils/mxfp_utils.py
src/compressed_tensors/registry/__init__.py
src/compressed_tensors/registry/registry.py
src/compressed_tensors/transform/__init__.py
src/compressed_tensors/transform/apply.py
src/compressed_tensors/transform/transform_args.py
src/compressed_tensors/transform/transform_config.py
src/compressed_tensors/transform/transform_scheme.py
src/compressed_tensors/transform/factory/__init__.py
src/compressed_tensors/transform/factory/base.py
src/compressed_tensors/transform/factory/hadamard.py
src/compressed_tensors/transform/factory/matrix_multiply.py
src/compressed_tensors/transform/factory/random_hadamard.py
src/compressed_tensors/transform/utils/__init__.py
src/compressed_tensors/transform/utils/hadamard.py
src/compressed_tensors/transform/utils/hadamards.safetensors
src/compressed_tensors/transform/utils/matrix.py
src/compressed_tensors/utils/__init__.py
src/compressed_tensors/utils/binary_search.py
src/compressed_tensors/utils/helpers.py
src/compressed_tensors/utils/internal.py
src/compressed_tensors/utils/match.py
src/compressed_tensors/utils/module.py
src/compressed_tensors/utils/mtp.py
src/compressed_tensors/utils/offload.py
src/compressed_tensors/utils/permutations_24.py
src/compressed_tensors/utils/safetensors_load.py
src/compressed_tensors/utils/semi_structured_conversions.py
src/compressed_tensors/utils/type.py
tests/__init__.py
tests/conftest.py
tests/emulate_device.py
tests/mock_observer.py
tests/testing_utils.py
tests/test_compressors/test_compress_decompress_module.py
tests/test_compressors/test_fp4_quant.py
tests/test_compressors/test_fp8_quant.py
tests/test_compressors/test_int_quant.py
tests/test_compressors/test_mxfp4_quant.py
tests/test_compressors/test_mxfp8_quant.py
tests/test_compressors/test_pack_quant.py
tests/test_compressors/test_packed_asym_decompression.py
tests/test_compressors/distributed/test_distributed_compression.py
tests/test_compressors/distributed/test_module_parallel.py
tests/test_compressors/model_compressors/test_model_compressor.py
tests/test_compressors/model_compressors/test_model_compressor_distributed.py
tests/test_compressors/model_compressors/test_transformers_integration.py
tests/test_configs/__init__.py
tests/test_configs/test_base.py
tests/test_configs/test_infer_quant.py
tests/test_entrypoints/convert/converters/test_build_inverse_weight_maps.py
tests/test_entrypoints/convert/converters/test_fp8block_dequantizer.py
tests/test_examples/test_bitmask_compression_ipynb.py
tests/test_modeling/test_attention_and_cache.py
tests/test_modeling/test_deepseekv3_kvcache_quant.py
tests/test_offload/conftest.py
tests/test_offload/test_dispatch.py
tests/test_offload/test_interface.py
tests/test_offload/test_load.py
tests/test_offload/test_module.py
tests/test_offload/test_xpu_routing.py
tests/test_offload/cache/conftest.py
tests/test_offload/cache/helpers.py
tests/test_offload/cache/test_cpu.py
tests/test_offload/cache/test_device.py
tests/test_offload/cache/test_disk.py
tests/test_offload/cache/test_dist_cpu.py
tests/test_offload/cache/test_dist_device.py
tests/test_offload/cache/test_dist_disk.py
tests/test_offload/convert/test_convert.py
tests/test_offload/convert/test_from_accelerate.py
tests/test_offload/convert/test_to_accelerate.py
tests/test_quantization/__init__.py
tests/test_quantization/test_quant_args.py
tests/test_quantization/test_quant_config.py
tests/test_quantization/test_quant_metadata.py
tests/test_quantization/test_quant_scheme.py
tests/test_quantization/lifecycle/__init__.py
tests/test_quantization/lifecycle/conftest.py
tests/test_quantization/lifecycle/test_apply.py
tests/test_quantization/lifecycle/test_dynamic_lifecycle.py
tests/test_quantization/lifecycle/test_enabled.py
tests/test_quantization/lifecycle/test_forward.py
tests/test_quantization/lifecycle/test_initialize.py
tests/test_quantization/lifecycle/test_lifecycle.py
tests/test_quantization/lifecycle/test_static_lifecycle.py
tests/test_quantization/test_configs/__init__.py
tests/test_quantization/test_configs/test_bit_depths.py
tests/test_quantization/test_configs/test_compression_format.py
tests/test_quantization/test_configs/test_strategies.py
tests/test_quantization/test_utils/test_helpers.py
tests/test_quantization/test_utils/test_mxfp4_utils.py
tests/test_quantization/test_utils/test_mxfp8_utils.py
tests/test_transform/conftest.py
tests/test_transform/test_transform_args.py
tests/test_transform/test_transform_config.py
tests/test_transform/test_transform_scheme.py
tests/test_transform/factory/test_correctness.py
tests/test_transform/factory/test_memory.py
tests/test_transform/factory/test_serialization.py
tests/test_transform/utils/test_hadamard.py
tests/test_utils/__init__.py
tests/test_utils/test_helpers.py
tests/test_utils/test_match.py
tests/test_utils/test_safetensors_load.py
tests/test_utils/test_save_mtp_tensors.py
tests/test_utils/test_type.py
utils/copyright.py