{"library":"bfcl-eval","type":"library","category":null,"description":"bfcl-eval is the Python library for the Berkeley Function Calling Leaderboard (BFCL), a benchmark to evaluate Large Language Models (LLMs) on their ability to perform function calling. It provides the evaluation pipeline and datasets, including support for multi-step and multi-turn function calls as of its V3 release. The library is actively maintained with frequent updates; its current PyPI version is 2026.3.23.","language":"python","status":"active","version":"2026.3.23","tags":["LLM evaluation","function calling","AI leaderboard","benchmark","tool use"],"last_verified":"Mon May 25","install":[{"cmd":"pip install bfcl-eval","imports":["from bfcl_eval.eval_pipeline import eval_handler","from bfcl_eval.eval_pipeline import EvalMetrics"]}],"homepage":null,"github":"https://github.com/ShishirPatil/gorilla","docs":null,"changelog":null,"pypi":"https://pypi.org/project/bfcl-eval/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":60,"avg_install_s":80.5,"avg_import_s":null,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/bfcl-eval/compatibility"}}