{"library":"ring-flash-attn","type":"library","category":null,"description":"Ring attention implementation with flash attention for efficient long-context LLM training. Supports distributed memory and compute parallelism. The current version is 0.1.8; the project is actively maintained on GitHub with weekly releases.","language":"python","status":"active","version":"0.1.8","tags":["flash-attention","ring-attention","long-context","transformer","distributed"],"last_verified":"Sun Jun 07","install":[{"cmd":"pip install ring-flash-attn","imports":["from ring_flash_attn import ring_flash_attn_func","from ring_flash_attn import zigzag_ring_flash_attn_func"]},{"cmd":"pip install ring-flash-attn[flash-attn]","imports":[]}],"homepage":"https://github.com/zhuzilin/ring-flash-attention","github":"https://github.com/zhuzilin/ring-flash-attention","docs":null,"changelog":null,"pypi":null,"npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":null}