{"library":"agentevals","type":"library","category":null,"description":"Agentevals is an open-source Python library from Microsoft designed to help developers effectively evaluate the performance of Large Language Model (LLM) agents. It provides a framework for defining custom agents, various types of evaluators (e.g., code execution, human feedback), and structured scenarios for consistent testing. The library is currently in early development (v0.0.9) and is expected to have regular updates with evolving features and APIs.","language":"python","status":"active","version":"0.0.9","tags":["LLM","agent","evaluation","AI","Microsoft","testing"],"last_verified":"Mon May 25","install":[{"cmd":"pip install agentevals","imports":["from agentevals.agents import CustomAgent","from agentevals.evaluators import CodeExecutionEvaluator","from agentevals.scenarios import HumanFeedbackScenario"]}],"homepage":null,"github":null,"docs":null,"changelog":null,"pypi":"https://pypi.org/project/agentevals/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.9–3.10","success_rate":100,"avg_install_s":11.4,"avg_import_s":null,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/agentevals/compatibility"}}