{"library":"transformer-engine-cu12","type":"library","category":null,"description":"Transformer Engine (TE) is a Python library by NVIDIA for accelerating Transformer models on NVIDIA GPUs. It enables lower-precision training and inference, notably supporting 8-bit (FP8) and 4-bit (NVFP4) floating-point precision on Hopper, Ada, and Blackwell GPUs, leading to better performance and reduced memory utilization. It provides highly optimized building blocks for popular Transformer architectures and an automatic-mixed-precision-like API for PyTorch and JAX. The current version is 2.13.0; releases are frequent and often align with new NVIDIA hardware and software advancements.","language":"python","status":"active","version":"2.13.0","tags":["AI/ML","Deep Learning","Transformers","NVIDIA","CUDA","Performance","Mixed Precision","FP8","FP4","PyTorch","JAX"],"last_verified":"Mon May 25","install":[{"cmd":"pip install --no-build-isolation transformer-engine-cu12[pytorch]","imports":["from transformer_engine.pytorch import Linear","from transformer_engine.pytorch import LayerNorm","from transformer_engine.pytorch import TransformerLayer","from transformer_engine.pytorch.fp8 import fp8_autocast"]},{"cmd":"pip install --no-build-isolation transformer-engine-cu12[jax]","imports":[]},{"cmd":"pip install --no-build-isolation transformer-engine-cu12[core]","imports":[]}],"homepage":"https://www.nvidia.com/en-us/data-center/products/transformer-engine/","github":null,"docs":null,"changelog":null,"pypi":"https://pypi.org/project/transformer-engine-cu12/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":100,"avg_install_s":12,"avg_import_s":null,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/transformer-engine-cu12/compatibility"}}