{"library":"auto-round","type":"library","category":null,"description":"AutoRound is an advanced weight-only quantization algorithm for large language models (LLMs), providing up to 4-bit quantization with minimal accuracy loss. Current version 0.13.0 supports various Intel and AMD GPUs, as well as CPUs. The package is under active development by Intel.","language":"python","status":"active","version":"0.13.0","tags":["quantization","llm","weight-only","intel","gpu"],"last_verified":"Sun Jun 07","install":[{"cmd":"pip install auto-round","imports":["from auto_round import AutoRound","from auto_round import AutoRoundConfig"]}],"homepage":"https://github.com/intel/auto-round","github":"https://github.com/intel/auto-round","docs":null,"changelog":null,"pypi":null,"npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":null}