{"library":"agentevals","type":"library","category":null,"description":"Agentevals is an open-source Python library from Microsoft designed to help developers effectively evaluate the performance of Large Language Model (LLM) agents. It provides a framework for defining custom agents, various types of evaluators (e.g., code execution, human feedback), and structured scenarios for consistent testing. The library is currently in early development (v0.0.9) and is expected to have regular updates with evolving features and APIs.","language":"python","status":"active","version":"0.0.9","tags":["LLM","agent","evaluation","AI","Microsoft","testing"],"install":[{"cmd":"pip install agentevals","imports":["import agentevals"]}],"homepage":null,"github":null,"docs":null,"changelog":null,"pypi":"https://pypi.org/project/agentevals/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":100,"avg_install_s":11.7,"avg_import_s":null,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/agentevals/compatibility"},"provenance":{"verified_status":"passing","verified_at":"Fri Jul 03","last_verified":"Fri Jul 03","next_check":"Sun Aug 02","install_tag":null}}