{ "info": { "author": "Amazon Web Services", "author_email": "agent-evaluation-oss-core-team@amazon.com", "bugtrack_url": null, "classifiers": [ "Development Status :: 4 - Beta", "Intended Audience :: Developers", "License :: OSI Approved :: Apache Software License", "Programming Language :: Python :: 3 :: Only", "Programming Language :: Python :: 3.10", "Programming Language :: Python :: 3.11", "Programming Language :: Python :: 3.12", "Programming Language :: Python :: 3.9", "Topic :: Software Development :: Testing", "Topic :: Utilities" ], "description": "![PyPI - Version](https://img.shields.io/pypi/v/agent-evaluation)\n![PyPI - Python Version](https://img.shields.io/pypi/pyversions/agent-evaluation)\n![GitHub License](https://img.shields.io/github/license/awslabs/agent-evaluation)\n[![security: bandit](https://img.shields.io/badge/security-bandit-yellow.svg)](https://github.com/PyCQA/bandit)\n[![Code style: black](https://img.shields.io/badge/code%20style-black-000000.svg)](https://github.com/psf/black)\n[![Built with Material for MkDocs](https://img.shields.io/badge/Material_for_MkDocs-526CFE?style=for-the-badge&logo=MaterialForMkDocs&logoColor=white)](https://squidfunk.github.io/mkdocs-material/)\n\n# Agent Evaluation\n\nAgent Evaluation is a generative AI-powered framework for testing virtual agents.\n\nInternally, Agent Evaluation implements an LLM agent (evaluator) that will orchestrate conversations with your own agent (target) and evaluate the responses during the conversation.\n\n## \u2728 Key features\n\n- Built-in support for popular AWS services including [Amazon Bedrock](https://aws.amazon.com/bedrock/), [Amazon Q Business](https://aws.amazon.com/q/business/), and [Amazon SageMaker](https://aws.amazon.com/sagemaker/). You can also [bring your own agent](https://awslabs.github.io/agent-evaluation/targets/custom_targets/) to test using Agent Evaluation.\n- Orchestrate concurrent, multi-turn conversations with your agent while evaluating its responses.\n- Define [hooks](https://awslabs.github.io/agent-evaluation/hooks/) to perform additional tasks such as integration testing.\n- Can be incorporated into CI/CD pipelines to expedite the time to delivery while maintaining the stability of agents in production environments.\n\n## \ud83d\udcda Documentation\n\nTo get started, please visit the full documentation [here](https://awslabs.github.io/agent-evaluation/). To contribute, please refer to [CONTRIBUTING.md](./CONTRIBUTING.md)\n\n## \ud83d\udc4f Contributors\n\nShout out to these awesome contributors:\n\n\n \n\n", "description_content_type": "text/markdown", "docs_url": null, "download_url": null, "downloads": { "last_day": -1, "last_month": -1, "last_week": -1 }, "dynamic": null, "home_page": "https://awslabs.github.io/agent-evaluation/", "keywords": null, "license": "Apache 2.0", "maintainer": null, "maintainer_email": null, "name": "agent-evaluation", "package_url": "https://pypi.org/project/agent-evaluation/", "platform": null, "project_url": "https://pypi.org/project/agent-evaluation/", "project_urls": { "Homepage": "https://awslabs.github.io/agent-evaluation/" }, "provides_extra": null, "release_url": "https://pypi.org/project/agent-evaluation/0.2.0/", "requires_dist": [ "pyyaml~=6.0", "boto3<2.0,>=1.34.20", "click~=8.0", "pydantic<3.0,>=2.1.0", "rich<14.0,>=13.7.0", "jinja2<4.0,>=3.1.3", "jsonpath-ng<2.0,>=1.6.1", "flake8; extra == \"dev\"", "black; extra == \"dev\"", "isort; extra == \"dev\"", "pytest; extra == \"dev\"", "pytest-cov; extra == \"dev\"", "pytest-mock; extra == \"dev\"", "mkdocs; extra == \"dev\"", "mkdocs-material; extra == \"dev\"", "mkdocstrings[python]; extra == \"dev\"", "mkdocs-click; extra == \"dev\"", "bandit; extra == \"dev\"", "pip-audit; extra == \"dev\"" ], "requires_python": ">=3.9", "summary": "A generative AI-powered framework for testing virtual agents.", "version": "0.2.0", "yanked": false, "yanked_reason": null }, "last_serial": 23191089, "releases": { "0.1.0": [ { "comment_text": "", "digests": { "blake2b_256": "d7e6731c68918c5fce4c71c58096ffb36d87ce70d925bdd825538e46d12fdab2", "md5": "0f9d744eff88fc238a56ae6f6df7944e", "sha256": "6c8876df6bb6fb932c724fa9ad16e31f81e60d4f7fd5986eba4651925ae183c5" }, "downloads": -1, "filename": "agent_evaluation-0.1.0-py3-none-any.whl", "has_sig": false, "md5_digest": "0f9d744eff88fc238a56ae6f6df7944e", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": ">=3.9", "size": 34665, "upload_time": "2024-05-03T22:25:09", "upload_time_iso_8601": "2024-05-03T22:25:09.390348Z", "url": "https://files.pythonhosted.org/packages/d7/e6/731c68918c5fce4c71c58096ffb36d87ce70d925bdd825538e46d12fdab2/agent_evaluation-0.1.0-py3-none-any.whl", "yanked": false, "yanked_reason": null }, { "comment_text": "", "digests": { "blake2b_256": "94a9fb463164dc38d476d3a544c9128607e4938095b72b24d64a172413439654", "md5": "375716b2f472dc6ed06e329ec14612b9", "sha256": "9209839c593be496a8c6764fe99562525d3c496685dfb4c6949006631ab2501d" }, "downloads": -1, "filename": "agent_evaluation-0.1.0.tar.gz", "has_sig": false, "md5_digest": "375716b2f472dc6ed06e329ec14612b9", "packagetype": "sdist", "python_version": "source", "requires_python": ">=3.9", "size": 22330, "upload_time": "2024-05-03T22:25:11", "upload_time_iso_8601": "2024-05-03T22:25:11.143570Z", "url": "https://files.pythonhosted.org/packages/94/a9/fb463164dc38d476d3a544c9128607e4938095b72b24d64a172413439654/agent_evaluation-0.1.0.tar.gz", "yanked": false, "yanked_reason": null } ], "0.2.0": [ { "comment_text": "", "digests": { "blake2b_256": "2fbcbbe6230edacd58b04c2d83c09fe8db799e5f4e3d372e5b1ca93da93012b9", "md5": "e24e4c79a950f67627047cc128dbab0a", "sha256": "ba24cc7e845435e9c5a50fadcaa9cbdd121dd7ead3edd135638f303e4babd312" }, "downloads": -1, "filename": "agent_evaluation-0.2.0-py3-none-any.whl", "has_sig": false, "md5_digest": "e24e4c79a950f67627047cc128dbab0a", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": ">=3.9", "size": 34677, "upload_time": "2024-05-13T21:14:27", "upload_time_iso_8601": "2024-05-13T21:14:27.018943Z", "url": "https://files.pythonhosted.org/packages/2f/bc/bbe6230edacd58b04c2d83c09fe8db799e5f4e3d372e5b1ca93da93012b9/agent_evaluation-0.2.0-py3-none-any.whl", "yanked": false, "yanked_reason": null }, { "comment_text": "", "digests": { "blake2b_256": "de348fc0850168c265da48c5082d8099cd50815372e164bd54b30479035b35d6", "md5": "372ea8b92c13456e6b20fae18312884b", "sha256": "afaada1e206022d4c3c2fece8e1494571aef4ca64d912badd6dd851b4fd4b2ac" }, "downloads": -1, "filename": "agent_evaluation-0.2.0.tar.gz", "has_sig": false, "md5_digest": "372ea8b92c13456e6b20fae18312884b", "packagetype": "sdist", "python_version": "source", "requires_python": ">=3.9", "size": 22294, "upload_time": "2024-05-13T21:14:28", "upload_time_iso_8601": "2024-05-13T21:14:28.862452Z", "url": "https://files.pythonhosted.org/packages/de/34/8fc0850168c265da48c5082d8099cd50815372e164bd54b30479035b35d6/agent_evaluation-0.2.0.tar.gz", "yanked": false, "yanked_reason": null } ] }, "urls": [ { "comment_text": "", "digests": { "blake2b_256": "2fbcbbe6230edacd58b04c2d83c09fe8db799e5f4e3d372e5b1ca93da93012b9", "md5": "e24e4c79a950f67627047cc128dbab0a", "sha256": "ba24cc7e845435e9c5a50fadcaa9cbdd121dd7ead3edd135638f303e4babd312" }, "downloads": -1, "filename": "agent_evaluation-0.2.0-py3-none-any.whl", "has_sig": false, "md5_digest": "e24e4c79a950f67627047cc128dbab0a", "packagetype": "bdist_wheel", "python_version": "py3", "requires_python": ">=3.9", "size": 34677, "upload_time": "2024-05-13T21:14:27", "upload_time_iso_8601": "2024-05-13T21:14:27.018943Z", "url": "https://files.pythonhosted.org/packages/2f/bc/bbe6230edacd58b04c2d83c09fe8db799e5f4e3d372e5b1ca93da93012b9/agent_evaluation-0.2.0-py3-none-any.whl", "yanked": false, "yanked_reason": null }, { "comment_text": "", "digests": { "blake2b_256": "de348fc0850168c265da48c5082d8099cd50815372e164bd54b30479035b35d6", "md5": "372ea8b92c13456e6b20fae18312884b", "sha256": "afaada1e206022d4c3c2fece8e1494571aef4ca64d912badd6dd851b4fd4b2ac" }, "downloads": -1, "filename": "agent_evaluation-0.2.0.tar.gz", "has_sig": false, "md5_digest": "372ea8b92c13456e6b20fae18312884b", "packagetype": "sdist", "python_version": "source", "requires_python": ">=3.9", "size": 22294, "upload_time": "2024-05-13T21:14:28", "upload_time_iso_8601": "2024-05-13T21:14:28.862452Z", "url": "https://files.pythonhosted.org/packages/de/34/8fc0850168c265da48c5082d8099cd50815372e164bd54b30479035b35d6/agent_evaluation-0.2.0.tar.gz", "yanked": false, "yanked_reason": null } ], "vulnerabilities": [] }