LICENSE
MANIFEST.in
README.md
pyproject.toml
requirements-cpu.txt
requirements-hpu.txt
requirements.txt
setup.cfg
setup.py
third-party-programs.txt
auto_round/__init__.py
auto_round/__main__.py
auto_round/alg_ext.py
auto_round/autoround.py
auto_round/calib_dataset.py
auto_round/envs.py
auto_round/formats.py
auto_round/logger.py
auto_round/schemes.py
auto_round/sign_sgd.py
auto_round/special_model_handler.py
auto_round/version.py
auto_round/wrapper.py
auto_round.egg-info/PKG-INFO
auto_round.egg-info/SOURCES.txt
auto_round.egg-info/dependency_links.txt
auto_round.egg-info/entry_points.txt
auto_round.egg-info/requires.txt
auto_round.egg-info/top_level.txt
auto_round/auto_scheme/__init__.py
auto_round/auto_scheme/delta_loss.py
auto_round/auto_scheme/gen_auto_scheme.py
auto_round/auto_scheme/register.py
auto_round/auto_scheme/utils.py
auto_round/compressors/__init__.py
auto_round/compressors/adam.py
auto_round/compressors/base.py
auto_round/compressors/config.py
auto_round/compressors/shard_writer.py
auto_round/compressors/utils.py
auto_round/compressors/diffusion/__init__.py
auto_round/compressors/diffusion/compressor.py
auto_round/compressors/diffusion/dataset.py
auto_round/compressors/diffusion/eval.py
auto_round/compressors/diffusion/hybrid.py
auto_round/compressors/mllm/__init__.py
auto_round/compressors/mllm/compressor.py
auto_round/compressors/mllm/dataset.py
auto_round/compressors/mllm/eval.py
auto_round/compressors/mllm/processor.py
auto_round/compressors/mllm/template.py
auto_round/compressors/mllm/utils.py
auto_round/compressors/mllm/templates/cogvlm2.json
auto_round/compressors/mllm/templates/default.json
auto_round/compressors/mllm/templates/llava.json
auto_round/compressors/mllm/templates/phi3_v.json
auto_round/data_type/__init__.py
auto_round/data_type/fp8.py
auto_round/data_type/gguf.py
auto_round/data_type/int.py
auto_round/data_type/mxfp.py
auto_round/data_type/nvfp.py
auto_round/data_type/register.py
auto_round/data_type/utils.py
auto_round/data_type/w4fp8.py
auto_round/eval/__init__.py
auto_round/eval/eval_cli.py
auto_round/eval/evaluation.py
auto_round/experimental/__init__.py
auto_round/experimental/attention.py
auto_round/experimental/kv_cache.py
auto_round/experimental/utils.py
auto_round/experimental/qmodules/__init__.py
auto_round/experimental/qmodules/base.py
auto_round/experimental/qmodules/fp4_utils.py
auto_round/experimental/qmodules/fp8_static.py
auto_round/experimental/qmodules/mx.py
auto_round/experimental/qmodules/nvfp4.py
auto_round/experimental/transform/__init__.py
auto_round/experimental/transform/apply.py
auto_round/experimental/transform/hadamard_config.py
auto_round/experimental/transform/hadamards.py
auto_round/experimental/transform/patch_modules.py
auto_round/experimental/transform/triton/__init__.py
auto_round/experimental/transform/triton/mxfp4.py
auto_round/experimental/transform/utils/__init__.py
auto_round/experimental/transform/utils/hadamard.py
auto_round/experimental/transform/utils/hadamards.safetensors
auto_round/experimental/transform/utils/matrix.py
auto_round/export/__init__.py
auto_round/export/utils.py
auto_round/export/export_to_autogptq/__init__.py
auto_round/export/export_to_autogptq/export.py
auto_round/export/export_to_autogptq/qlinear_triton.py
auto_round/export/export_to_autoround/__init__.py
auto_round/export/export_to_autoround/export.py
auto_round/export/export_to_autoround/export_to_fp8.py
auto_round/export/export_to_autoround/export_to_nvfp_mxfp.py
auto_round/export/export_to_autoround/qlinear_fp.py
auto_round/export/export_to_autoround/qlinear_triton_act.py
auto_round/export/export_to_autoround/utils.py
auto_round/export/export_to_awq/__init__.py
auto_round/export/export_to_awq/export.py
auto_round/export/export_to_awq/utils.py
auto_round/export/export_to_gguf/__init__.py
auto_round/export/export_to_gguf/config.py
auto_round/export/export_to_gguf/convert.py
auto_round/export/export_to_gguf/convert_hf_to_gguf.py
auto_round/export/export_to_gguf/export.py
auto_round/export/export_to_gguf/packing.py
auto_round/export/export_to_gguf/special_handle.py
auto_round/export/export_to_llmcompressor/__init__.py
auto_round/export/export_to_llmcompressor/config.py
auto_round/export/export_to_llmcompressor/export.py
auto_round/export/export_to_llmcompressor/export_to_fp.py
auto_round/export/export_to_llmcompressor/export_to_static_fp.py
auto_round/export/export_to_llmcompressor/utils.py
auto_round/inference/__init__.py
auto_round/inference/backend.py
auto_round/inference/convert_model.py
auto_round/inference/utils.py
auto_round/modeling/__init__.py
auto_round/modeling/finegrained_fp8_patch.py
auto_round/modeling/finegrained_fp8_patch_v4.py
auto_round/modeling/fp8_quant.py
auto_round/modeling/hpu_patch.py
auto_round/modeling/fused_moe/__init__.py
auto_round/modeling/fused_moe/deepseek_v2.py
auto_round/modeling/fused_moe/gpt_oss.py
auto_round/modeling/fused_moe/llama4.py
auto_round/modeling/fused_moe/moe_experts_interface.py
auto_round/modeling/fused_moe/qwen3_5_moe.py
auto_round/modeling/fused_moe/qwen3_omni.py
auto_round/modeling/fused_moe/qwen3_vl_moe.py
auto_round/modeling/fused_moe/replace_modules.py
auto_round/modeling/fused_moe/step3_5_moe.py
auto_round/modeling/fused_moe/utils.py
auto_round/modeling/unfused_moe/__init__.py
auto_round/modeling/unfused_moe/deepseek_v3.py
auto_round/modeling/unfused_moe/ernie4_5_moe.py
auto_round/modeling/unfused_moe/glm_moe.py
auto_round/modeling/unfused_moe/glm_moe_dsa.py
auto_round/modeling/unfused_moe/glm_moe_light.py
auto_round/modeling/unfused_moe/qwen3_moe.py
auto_round/modeling/unfused_moe/qwen3_next.py
auto_round/utils/__init__.py
auto_round/utils/common.py
auto_round/utils/device.py
auto_round/utils/distributed.py
auto_round/utils/missing_tensors.py
auto_round/utils/model.py
auto_round/utils/offload.py
auto_round/utils/weight_handler.py
auto_round_extension/__init__.py
auto_round_extension/ark/__init__.py
auto_round_extension/ark/install_kernel.py
auto_round_extension/ark/qlinear.py
auto_round_extension/cuda/__init__.py
auto_round_extension/cuda/gptqmodel_marlin.py
auto_round_extension/hpu/__init__.py
auto_round_extension/hpu/qlinear_hpu.py
auto_round_extension/hpu/qlinear_hpu_gptq.py
auto_round_extension/ipex/__init__.py
auto_round_extension/ipex/qlinear_ipex_awq.py
auto_round_extension/ipex/qlinear_ipex_gptq.py
auto_round_extension/torch/__init__.py
auto_round_extension/torch/qlinear_torch.py
auto_round_extension/torch/qlinear_torch_zp.py
auto_round_extension/triton/__init__.py
auto_round_extension/triton/qlinear_tritonv2.py
auto_round_extension/triton/qlinear_tritonv2_zp.py
auto_round_extension/triton/triton_utils/__init__.py
auto_round_extension/triton/triton_utils/custom_autotune.py
auto_round_extension/triton/triton_utils/dequant.py
auto_round_extension/triton/triton_utils/kernels.py
auto_round_extension/triton/triton_utils/mixin.py
auto_round_extension/triton/triton_utils_zp/__init__.py
auto_round_extension/triton/triton_utils_zp/custom_autotune.py
auto_round_extension/triton/triton_utils_zp/dequant.py
auto_round_extension/triton/triton_utils_zp/kernels.py
auto_round_extension/triton/triton_utils_zp/mixin.py
auto_round_extension/vllm_ext/__init__.py
auto_round_extension/vllm_ext/auto_round_ext.py
auto_round_extension/vllm_ext/envs_ext.py
auto_round_extension/vllm_ext/fp4_utils.py
auto_round_extension/vllm_ext/kv_cache.py
auto_round_extension/vllm_ext/linear_impl_mxfp4.py
auto_round_extension/vllm_ext/linear_impl_mxfp8.py
auto_round_extension/vllm_ext/moe_impl_mxfp4.py
auto_round_extension/vllm_ext/moe_impl_mxfp8.py
auto_round_extension/vllm_ext/mxfp4_qdq_utils.py
auto_round_extension/vllm_ext/mxfp8_qdq_utils.py
auto_round_extension/vllm_ext/quant_impl.py
auto_round_extension/vllm_ext/quant_method_linear.py
auto_round_extension/vllm_ext/quant_method_moe.py
auto_round_extension/vllm_ext/sitecustomize.py
auto_round_extension/vllm_ext/utils.py
auto_round_extension/vllm_ext/vllm_oot_patches.py