{"library":"datasketches","type":"library","category":null,"description":"The Apache DataSketches Library for Python provides a collection of high-performance, stochastic streaming algorithms (sketches) for approximate queries on massive datasets. These sketches offer mathematically proven error bounds and are designed for problems like count-distinct, quantiles, most-frequent items, joins, matrix computations, and graph analysis. The current version is 5.2.0; releases follow a regular cadence as part of the Apache DataSketches project.","language":"python","status":"active","version":"5.2.0","tags":["data sketches","streaming algorithms","approximate queries","big data","quantiles","distinct count","probabilistic data structures","high-performance computing"],"last_verified":"Sat May 23","install":[{"cmd":"pip install datasketches","imports":["import datasketches","from datasketches import kll_ints_sketch"]}],"homepage":"https://datasketches.apache.org","github":null,"docs":null,"changelog":null,"pypi":"https://pypi.org/project/datasketches/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":100,"avg_install_s":3.6,"avg_import_s":0.27,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/datasketches/compatibility"}}