{"library":"deepeval","type":"library","category":null,"description":"DeepEval is an LLM evaluation framework that helps developers evaluate any LLM workflow, from simple prompt chains to complex multi-step agents. It provides a suite of metrics for various evaluation aspects like relevancy, faithfulness, hallucination, and agentic task completion. Currently at version 3.9.6, the library maintains a frequent release cadence, often introducing new metrics, test case types, and developer experience improvements.","language":"python","status":"active","version":"3.9.6","tags":["LLM evaluation","AI agents","metrics","observability","testing","rag"],"last_verified":"Wed May 20","install":[{"cmd":"pip install deepeval","imports":["from deepeval import evaluate","from deepeval.test_case import LLMTestCase","from deepeval.test_case import Turn","from deepeval.metrics import AnswerRelevancyMetric"]}],"homepage":"https://docs.confident-ai.com","github":"https://github.com/confident-ai/deepeval","docs":"https://deepeval.com","changelog":null,"pypi":"https://pypi.org/project/deepeval/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":90,"avg_install_s":14.2,"avg_import_s":5.52,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/deepeval/compatibility"}}