{"library":"ctransformers","type":"library","category":null,"description":"Python bindings for Transformer models implemented in C/C++ using the GGML library. Provides a high-level API for inference with popular models (LLaMA, Falcon, GPT-J, StarCoder, etc.) in GGML/GGUF format, with optional GPU acceleration (CUDA, Metal, ROCm). Latest version 0.2.27, active development.","language":"python","status":"active","version":"0.2.27","tags":["llm","inference","ggml","gguf","transformer","cuda","metal","rocm"],"last_verified":"Fri May 01","install":[{"cmd":"pip install ctransformers","imports":["from ctransformers import AutoModelForCausalLM"]},{"cmd":"pip install ctransformers[cuda]","imports":[]},{"cmd":"pip install ctransformers[metal]","imports":[]},{"cmd":"pip install ctransformers[rocm]","imports":[]}],"homepage":"https://ctransformers.dev","github":"https://github.com/marella/ctransformers","docs":null,"changelog":null,"pypi":"https://pypi.org/project/ctransformers/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":null}