{"id":28020,"library":"ossdata","title":"OSSDatasets","description":"OSSDatasets provides scalable access to Software Engineering datasets such as SWE-bench and GitHub issue data. It downloads and caches datasets locally for reproducible ML experiments. Current version 0.3.7, release cadence irregular.","status":"active","version":"0.3.7","language":"python","source_language":"en","source_url":"https://github.com/SWE-bench/OSSDatasets","tags":["datasets","swe-bench","software-engineering","ml"],"install":[{"cmd":"pip install ossdata","lang":"bash","label":"Default install"}],"dependencies":[],"imports":[{"note":"","wrong":"","symbol":"load_dataset","correct":"from ossdata import load_dataset"}],"quickstart":{"code":"import os\nfrom ossdata import load_dataset\n\n# Load SWE-bench dataset (cached automatically)\ndataset = load_dataset('swe-bench', split='train')\nprint(dataset[:2])","lang":"python","description":"Load a dataset by name (e.g., 'swe-bench') with automatic caching. Returns a list of dicts."},"warnings":[{"fix":"Check the exact dataset name in the docs.","message":"The dataset name must be exact; allowed names: 'swe-bench', 'swe-bench-lite', 'github-issues' (case-sensitive).","severity":"gotcha","affected_versions":"all"},{"fix":"Wrap with `pd.DataFrame(dataset)` or use dict-comprehensions.","message":"The returned data format is a list of dicts, not a Hugging Face Dataset or pandas DataFrame. You may need to convert manually.","severity":"gotcha","affected_versions":"0.3.x"},{"fix":"Use `from ossdata import load_dataset` and call `load_dataset(...)`.","message":"Version 0.2.x and earlier used a different API: `import ossdata` then `ossdata.get_dataset(...)`. The old API is removed in 0.3.0.","severity":"breaking","affected_versions":">=0.3.0"}],"env_vars":null,"last_verified":"2026-05-09T00:00:00.000Z","next_check":"2026-08-07T00:00:00.000Z","problems":[{"fix":"Run `pip install ossdata` in your active Python environment.","cause":"Package not installed or installed in wrong environment.","error":"ModuleNotFoundError: No module named 'ossdata'"},{"fix":"Use exact dataset name with hyphens: `load_dataset('swe-bench', ...)`.","cause":"Dataset name typo (underscore instead of hyphen).","error":"ValueError: Dataset 'swe_bench' not found. Available datasets: ['swe-bench', 'swe-bench-lite', 'github-issues']"}],"ecosystem":"pypi","meta_description":null,"install_score":null,"install_tag":null,"quickstart_score":null,"quickstart_tag":null}