LICENSE
README.md
pyproject.toml
benchmark/llama3-8b-gptq/quant_benchmark.py
benchmark/llama3-8b-jointq/quant_benchmark.py
benchmark/llama3-8b-qep-gptq/quant_benchmark.py
benchmark/llama3-8b-various/quant_benchmark.py
benchmark/qwen3-14b-gptq/quant_benchmark.py
benchmark/qwen3-14b-jointq/quant_benchmark.py
benchmark/qwen3-8b-gptq/quant_benchmark.py
benchmark/qwen3-8b-jointq/quant_benchmark.py
example/example_auto_run.py
example/example_autobit.py
example/example_gptq.py
example/example_jointq.py
example/example_qep_gptq.py
example/example_save_load.py
example/post_process/example_lora_sft.py
example/post_process/example_lora_sft_knowledge.py
example/pre_process/example_llama_preprocess_rtn.py
example/pre_process/example_preprocess_save_load.py
example/vllm_inference/example_autobit_vllm_inference.py
example/vllm_inference/example_gptq_vllm_inference.py
onecomp/__init__.py
onecomp/__main__.py
onecomp/__version__.py
onecomp/cli.py
onecomp/log.py
onecomp/model_config.py
onecomp/quantized_model_loader.py
onecomp/rotated_model_config.py
onecomp/runner.py
onecomp.egg-info/PKG-INFO
onecomp.egg-info/SOURCES.txt
onecomp.egg-info/dependency_links.txt
onecomp.egg-info/entry_points.txt
onecomp.egg-info/requires.txt
onecomp.egg-info/top_level.txt
onecomp/analyzer/__init__.py
onecomp/analyzer/cumulative_error.py
onecomp/analyzer/weight_outlier.py
onecomp/post_process/__init__.py
onecomp/post_process/_base.py
onecomp/post_process/blockwise_ptq.py
onecomp/post_process/post_process_lora_sft.py
onecomp/pre_process/__init__.py
onecomp/pre_process/hadamard_utils.py
onecomp/pre_process/modeling_llama.py
onecomp/pre_process/modeling_qwen3.py
onecomp/pre_process/optimizer.py
onecomp/pre_process/prepare_rotated_model.py
onecomp/pre_process/preprocess_args.py
onecomp/pre_process/quant_models.py
onecomp/pre_process/rotation_utils.py
onecomp/pre_process/train_rotation.py
onecomp/qep/__init__.py
onecomp/qep/_qep_config.py
onecomp/qep/_quantize_with_qep.py
onecomp/qep/_quantize_with_qep_arch.py
onecomp/quantizer/__init__.py
onecomp/quantizer/_quantizer.py
onecomp/quantizer/gemlite.py
onecomp/quantizer/arb/__init__.py
onecomp/quantizer/arb/_arb.py
onecomp/quantizer/arb/arb_impl.py
onecomp/quantizer/autobit/__init__.py
onecomp/quantizer/autobit/_autobit.py
onecomp/quantizer/autobit/activation_stats.py
onecomp/quantizer/autobit/dbf_fallback.py
onecomp/quantizer/autobit/ilp.py
onecomp/quantizer/autobit/manual.py
onecomp/quantizer/autobit/visualize.py
onecomp/quantizer/cq/__init__.py
onecomp/quantizer/cq/_cq.py
onecomp/quantizer/cq/cq_impl.py
onecomp/quantizer/dbf/__init__.py
onecomp/quantizer/dbf/_dbf.py
onecomp/quantizer/dbf/admm_extended.py
onecomp/quantizer/dbf/balance.py
onecomp/quantizer/dbf/config.py
onecomp/quantizer/dbf/dbf_impl.py
onecomp/quantizer/dbf/dbf_layer.py
onecomp/quantizer/dbf/dbf_original.py
onecomp/quantizer/dbf/fine_tune.py
onecomp/quantizer/dbf/middle.py
onecomp/quantizer/gptq/__init__.py
onecomp/quantizer/gptq/_gptq.py
onecomp/quantizer/gptq/config.py
onecomp/quantizer/gptq/gptq_layer.py
onecomp/quantizer/jointq/__init__.py
onecomp/quantizer/jointq/_jointq.py
onecomp/quantizer/jointq/core/__init__.py
onecomp/quantizer/jointq/core/__version__.py
onecomp/quantizer/jointq/core/clip.py
onecomp/quantizer/jointq/core/gptq.py
onecomp/quantizer/jointq/core/local_search.py
onecomp/quantizer/jointq/core/quantize.py
onecomp/quantizer/jointq/core/quantize_multi_gpu.py
onecomp/quantizer/jointq/core/quantizer.py
onecomp/quantizer/jointq/core/solution.py
onecomp/quantizer/jointq/core/error_propagation/__init__.py
onecomp/quantizer/jointq/core/error_propagation/local_search_advanced.py
onecomp/quantizer/jointq/core/error_propagation/quantize_advanced.py
onecomp/quantizer/jointq/core/error_propagation/quantizer_advanced.py
onecomp/quantizer/onebit/__init__.py
onecomp/quantizer/onebit/_onebit.py
onecomp/quantizer/onebit/onebit_impl.py
onecomp/quantizer/onebit/onebit_layer.py
onecomp/quantizer/qbb/__init__.py
onecomp/quantizer/qbb/_qbb.py
onecomp/quantizer/qbb/qbb_impl.py
onecomp/quantizer/quip/__init__.py
onecomp/quantizer/quip/_quip.py
onecomp/quantizer/quip/quant_quip.py
onecomp/quantizer/quip/quip_impl.py
onecomp/quantizer/quip/utils.py
onecomp/quantizer/quip/utils_had.py
onecomp/quantizer/quip/vector_balance.py
onecomp/quantizer/rtn/__init__.py
onecomp/quantizer/rtn/_rtn.py
onecomp/quantizer/rtn/quantizer.py
onecomp/quantizer/rtn/rtn_impl.py
onecomp/runner_methods/__init__.py
onecomp/runner_methods/chunked_quantization.py
onecomp/runner_methods/jointq_error_propagation.py
onecomp/runner_methods/multi_gpu_quantization.py
onecomp/utils/__init__.py
onecomp/utils/accuracy.py
onecomp/utils/activation_capture.py
onecomp/utils/activation_check.py
onecomp/utils/blockwise.py
onecomp/utils/calibration.py
onecomp/utils/perplexity.py
onecomp/utils/quant_config.py
onecomp/utils/vram_estimator.py
vllm_plugins/__init__.py
vllm_plugins/dbf/__init__.py
vllm_plugins/dbf/vllm_plugin.py
vllm_plugins/dbf/modules/__init__.py
vllm_plugins/dbf/modules/gemlite_linear.py
vllm_plugins/dbf/modules/naive.py
vllm_plugins/gptq/__init__.py
vllm_plugins/gptq/vllm_plugin.py
vllm_plugins/utils/__init__.py
vllm_plugins/utils/module.py