{"library":"pycuda","title":"PyCUDA","description":"PyCUDA is a Python wrapper for Nvidia CUDA. It provides access to Nvidia's CUDA parallel computation API from Python. The latest version is 2026.1 (requires Python ~=3.8, i.e. Python 3.8 or any later 3.x release). Release cadence is roughly semi-annual.","language":"python","status":"active","last_verified":"Fri May 01","install":{"commands":["pip install pycuda"],"cli":null},"imports":["import pycuda.autoinit","import pycuda.driver as cuda","from pycuda.compiler import SourceModule"],"auth":{"required":false,"env_vars":[]},"quickstart":{"code":"import pycuda.autoinit\nimport pycuda.driver as cuda\nimport numpy as np\nfrom pycuda.compiler import SourceModule\n\nmod = SourceModule(\"\"\"\n__global__ void add_one(float *a)\n{\n    int idx = threadIdx.x;\n    a[idx] += 1.0f;\n}\n\"\"\")\n\nadd_one = mod.get_function(\"add_one\")\na = np.array([1.0, 2.0, 3.0], dtype=np.float32)\n# Launch exactly one thread per element: the kernel has no bounds check,\n# so any extra thread would write past the end of the device buffer.\nadd_one(cuda.InOut(a), block=(a.size,1,1), grid=(1,1))\nprint(a)","lang":"python","description":"Compiles a CUDA kernel that adds 1 to each element of a float32 array, launches it with one thread per element, and prints the updated array.","tag":null,"tag_description":null,"last_tested":null,"results":[]},"compatibility":null}