{"library":"cerebras-cloud-sdk","type":"library","category":null,"description":"Official Python SDK for the Cerebras Cloud inference API. Provides access to ultra-fast LLM inference on Cerebras Wafer-Scale Engine hardware. OpenAI-compatible API surface. Generated with Stainless. Current version: 1.67.0 (Mar 2026). Requires Python 3.9+. Note: this package is separate from cerebras-sdk on PyPI, which is a hardware kernel development tool — a completely different product.","language":"python","status":"active","version":"1.67.0","tags":["cerebras","llm","inference","python","fast-inference","llama"],"last_verified":"Tue Jun 09","install":[{"cmd":"pip install cerebras-cloud-sdk","imports":["from cerebras.cloud.sdk import Cerebras\nimport os\n\nclient = Cerebras(\n    api_key=os.environ.get('CEREBRAS_API_KEY')\n)\n\nresponse = client.chat.completions.create(\n    model='llama3.1-8b',\n    messages=[{'role': 'user', 'content': 'Why is fast inference important?'}]\n)\nprint(response.choices[0].message.content)","from cerebras.cloud.sdk import AsyncCerebras\nimport asyncio, os\n\nclient = AsyncCerebras(\n    api_key=os.environ.get('CEREBRAS_API_KEY')\n)\n\nasync def main():\n    response = await client.chat.completions.create(\n        model='llama3.1-8b',\n        messages=[{'role': 'user', 'content': 'Hello'}]\n    )\n    print(response.choices[0].message.content)\n\nasyncio.run(main())"]}],"homepage":"https://cloud.cerebras.ai","github":"https://github.com/Cerebras/cerebras-cloud-sdk-python","docs":null,"changelog":null,"pypi":"https://pypi.org/project/cerebras-cloud-sdk/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.9+","success_rate":100,"avg_install_s":4.2,"avg_import_s":0.86,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/cerebras-cloud-sdk/compatibility"}}