{"library":"nvidia-modelopt-core","type":"library","category":null,"description":"The NVIDIA TensorRT Model Optimizer (ModelOpt) is a unified toolkit for model optimization and deployment across NVIDIA GPUs, supporting quantization (post-training quantization [PTQ] and quantization-aware training [QAT]), pruning, distillation, and TensorRT export. As of v0.33.1, the library is actively maintained and targets Python 3.10–3.12. Release cadence is approximately monthly.","language":"python","status":"active","version":"0.33.1","tags":["model-optimization","quantization","tensorrt","pruning","distillation"],"last_verified":"Sun Jun 07","install":[{"cmd":"pip install nvidia-modelopt-core","imports":["from modelopt.torch.opt import ModelOptTorchModel","from modelopt.torch.quantization import quantize"]},{"cmd":"pip install nvidia-modelopt-core[all]","imports":[]}],"homepage":"https://github.com/NVIDIA/TensorRT-Model-Optimizer","github":"https://github.com/NVIDIA/TensorRT-Model-Optimizer","docs":null,"changelog":null,"pypi":null,"npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":null}