{"library":"runai-model-streamer-s3","type":"library","category":null,"description":"The `runai-model-streamer-s3` library acts as a backend for the `runai-model-streamer`, enabling high-performance streaming of AI model weights (specifically Safetensors format) directly from S3-compatible object storage to GPU memory. It significantly reduces model loading times, addressing 'cold start' issues for large language models in inference scenarios. The current version is 0.15.8, with releases often aligned with the main `runai-model-streamer` project.","language":"en","status":"active","version":"0.15.8","tags":["AI/ML","model serving","S3","streaming","GPU","vLLM","LLM"],"last_verified":"Wed May 27","install":[{"cmd":"pip install runai-model-streamer-s3","imports":["from runai_model_streamer import SafetensorsStreamer"]},{"cmd":"pip install vllm[runai]","imports":[]}],"homepage":null,"github":null,"docs":null,"changelog":null,"pypi":null,"npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":25,"avg_install_s":3.8,"avg_import_s":null,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/runai-model-streamer-s3/compatibility"}}