{"library":"autoawq","type":"library","category":null,"description":"AutoAWQ implements the AWQ (Activation-aware Weight Quantization) algorithm for 4-bit quantization of large language models, achieving up to 2x speedup during inference. The library has been deprecated since v0.2.9 (April 2025); the vLLM project has since adopted the technology. Last tested with Torch 2.6.0 and Transformers 4.51.3.","language":"python","status":"deprecated","version":"0.2.9","tags":["quantization","awq","4-bit","llm","inference","deprecated"],"install":[{"cmd":"pip install autoawq","imports":["from awq import AutoAWQForCausalLM","from awq import AutoAWQConfig"]},{"cmd":"pip install autoawq[extras]","imports":[]}],"homepage":null,"github":"https://github.com/casper-hansen/AutoAWQ","docs":null,"changelog":null,"pypi":"https://pypi.org/project/autoawq/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.9–3.10","success_rate":20,"avg_install_s":80.6,"avg_import_s":22.52,"wheel_type":"sdist"},"url":"https://checklist.day/v1/registry/autoawq/compatibility"},"provenance":{"verified_status":"passing","verified_at":"Sun Jun 28","last_verified":"Sun Jun 28","next_check":"Tue Jul 28","install_tag":null}}