diff --git a/libs/langchain/tests/unit_tests/smith/evaluation/test_runner_utils.py b/libs/langchain/tests/unit_tests/smith/evaluation/test_runner_utils.py index 6291d241f4977..914958031dcf1 100644 --- a/libs/langchain/tests/unit_tests/smith/evaluation/test_runner_utils.py +++ b/libs/langchain/tests/unit_tests/smith/evaluation/test_runner_utils.py @@ -296,8 +296,8 @@ async def mock_arun_chain( tags: Optional[List[str]] = None, callbacks: Optional[Any] = None, **kwargs: Any, - ) -> List[Dict[str, Any]]: - return [{"result": f"Result for example {example.id}"}] + ) -> Dict[str, Any]: + return {"result": f"Result for example {example.id}"} def mock_create_project(*args: Any, **kwargs: Any) -> Any: proj = mock.MagicMock() @@ -324,9 +324,10 @@ def mock_create_project(*args: Any, **kwargs: Any) -> Any: ) expected = { - uuid_: [ - {"result": f"Result for example {uuid.UUID(uuid_)}"} for _ in range(1) - ] + uuid_: { + "output": {"result": f"Result for example {uuid.UUID(uuid_)}"}, + "feedback": [], + } for uuid_ in uuids } assert results["results"] == expected