{"library":"mamba-ssm","title":"Mamba State-Space Model","description":"Mamba is a state-space model architecture designed for efficient sequence modeling, offering linear-time inference and parallelizable training. Currently at version 2.3.1, it requires Python >=3.9 and is under active development with frequent releases focused on ROCm and CUDA compatibility.","language":"python","status":"active","last_verified":"Mon Apr 27","install":{"commands":["pip install mamba-ssm","pip install mamba-ssm[causal-conv1d]"],"cli":null},"imports":["from mamba_ssm import Mamba","from mamba_ssm import Mamba2"],"auth":{"required":false,"env_vars":[]},"quickstart":{"code":"import torch\nfrom mamba_ssm import Mamba\n\nbatch, seq_len, dim = 2, 128, 16\nmodel = Mamba(\n    d_model=dim,\n    d_state=16,\n    d_conv=4,\n    expand=2,\n    dt_rank='auto',\n    bias=False,\n    conv_bias=True,\n    device='cuda',\n    dtype=torch.float16\n)\nx = torch.randn(batch, seq_len, dim, device='cuda', dtype=torch.float16)\ny = model(x)\nprint(y.shape)\n# Expected: torch.Size([2, 128, 16])","lang":"python","description":"Instantiate a Mamba model and run a forward pass on GPU with float16 precision.","tag":null,"tag_description":null,"last_tested":null,"results":[]},"compatibility":null}