From 784927205c6080ddb0d11f079ad3acba4a249eec Mon Sep 17 00:00:00 2001 From: Connor McCarthy Date: Mon, 18 Dec 2023 18:50:37 -0500 Subject: [PATCH] feat(sdk): add local execution logging #localexecution (#10326) --- sdk/python/kfp/local/e2e_test.py | 55 ----- sdk/python/kfp/local/logging_utils.py | 135 ++++++++++++ sdk/python/kfp/local/logging_utils_test.py | 206 ++++++++++++++++++ .../kfp/local/subprocess_task_handler.py | 6 +- sdk/python/kfp/local/task_dispatcher.py | 74 +++++-- sdk/python/kfp/local/task_dispatcher_test.py | 98 +++++++++ 6 files changed, 493 insertions(+), 81 deletions(-) create mode 100644 sdk/python/kfp/local/logging_utils.py create mode 100644 sdk/python/kfp/local/logging_utils_test.py diff --git a/sdk/python/kfp/local/e2e_test.py b/sdk/python/kfp/local/e2e_test.py index cffaf84638e..93d6622f0da 100644 --- a/sdk/python/kfp/local/e2e_test.py +++ b/sdk/python/kfp/local/e2e_test.py @@ -17,8 +17,6 @@ These can be thought of as local runner conformance tests. The test results should be the same irrespective of the runner. """ -import io -import sys from typing import NamedTuple import unittest @@ -323,58 +321,5 @@ def my_comp(out_param: dsl.OutputPath(str),) -> int: self.assertEqual(task.outputs['Output'], 1) -@parameterized.parameters(ALL_RUNNERS) -class TestExceptionHandling(testing_utilities.LocalRunnerEnvironmentTestCase): - - def setUp(self): - super().setUp() - # capture logs on a test-by-test basis - self.captured_stdout = io.StringIO() - sys.stdout = self.captured_stdout - - def tearDown(self): - super().setUp() - # reset stdout - sys.stdout = sys.__stdout__ - - def test_user_code_throws_exception_if_raise_on_error(self, runner): - local.init(runner=runner, raise_on_error=True) - - @dsl.component - def fail_comp(): - raise Exception('String to match on') - - # use end of line anchor $, since the user code error should be the last thing surfaced to the user - with self.assertRaisesRegex( - RuntimeError, - r'Local execution exited with status FAILURE\.$', - ): - fail_comp() - - self.assertIn( - 'Exception: String to match on', - self.captured_stdout.getvalue(), - ) - - def test_user_code_no_exception_if_not_raise_on_error(self, runner): - local.init(runner=runner, raise_on_error=False) - - @dsl.component - def fail_comp(): - raise Exception('String to match on') - - task = fail_comp() - self.assertDictEqual(task.outputs, {}) - - self.assertIn( - 'Local execution exited with status FAILURE.', - self.captured_stdout.getvalue(), - ) - self.assertIn( - 'Exception: String to match on', - self.captured_stdout.getvalue(), - ) - - if __name__ == '__main__': unittest.main() diff --git a/sdk/python/kfp/local/logging_utils.py b/sdk/python/kfp/local/logging_utils.py new file mode 100644 index 00000000000..dd4d2d90843 --- /dev/null +++ b/sdk/python/kfp/local/logging_utils.py @@ -0,0 +1,135 @@ +# Copyright 2023 The Kubeflow Authors +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +"""Utilitites for formatting, coloring, and controlling the output of logs.""" +import builtins +import contextlib +import datetime +import logging +from typing import Any, Dict, Generator, List + +from kfp import dsl + + +class Color: + CYAN = '\033[96m' + GREEN = '\033[92m' + RED = '\033[91m' + RESET = '\033[0m' + + +class MillisecondFormatter(logging.Formatter): + + def formatTime( + self, + record: logging.LogRecord, + datefmt: str = None, + ) -> str: + created = datetime.datetime.fromtimestamp(record.created) + s = created.strftime(datefmt) + # truncate microseconds to milliseconds + return s[:-3] + + +@contextlib.contextmanager +def local_logger_context() -> Generator[None, None, None]: + """Context manager for creating and reseting the local execution logger.""" + + logger = logging.getLogger() + original_level = logger.level + original_handlers = logger.handlers[:] + formatter = MillisecondFormatter( + fmt='%(asctime)s - %(levelname)s - %(message)s', + datefmt='%H:%M:%S.%f', + ) + handler = logging.StreamHandler() + handler.setFormatter(formatter) + logger.handlers.clear() + logger.addHandler(handler) + logger.setLevel(logging.INFO) + + try: + yield + finally: + logger.setLevel(original_level) + logger.handlers.clear() + for handler in original_handlers: + logger.addHandler(handler) + + +@contextlib.contextmanager +def indented_print(num_spaces: int = 4) -> Generator[None, None, None]: + """Context manager to indent all print statements in its scope by + num_prints. + + Useful for visually separating a subprocess logs from the outer + process logs. + """ + original_print = builtins.print + + def indented_print_function(*args, **kwargs): + original_print(' ' * num_spaces, end='') + return original_print(*args, **kwargs) + + builtins.print = indented_print_function + try: + yield + finally: + builtins.print = original_print + + +def color_text(text: str, color: Color) -> str: + return f'{color}{text}{Color.RESET}' + + +def make_log_lines_for_artifact(artifact: dsl.Artifact,) -> List[str]: + """Returns a list of log lines that represent a single artifact output.""" + artifact_class_name_and_paren = f'{artifact.__class__.__name__}( ' + # name + artifact_lines = [f'{artifact_class_name_and_paren}name={artifact.name},'] + newline_spaces = len(artifact_class_name_and_paren) * ' ' + # uri + artifact_lines.append(f'{newline_spaces}uri={artifact.uri},') + # metadata + artifact_lines.append(f'{newline_spaces}metadata={artifact.metadata} )') + return artifact_lines + + +def make_log_lines_for_outputs(outputs: Dict[str, Any]) -> List[str]: + """Returns a list of log lines to repesent the outputs of a task.""" + INDENT = ' ' * 4 + SEPARATOR = ': ' + output_lines = [] + for key, value in outputs.items(): + key_chars = INDENT + key + SEPARATOR + + # present artifacts + if isinstance(value, dsl.Artifact): + artifact_lines = make_log_lines_for_artifact(value) + + first_artifact_line = artifact_lines[0] + output_lines.append(f'{key_chars}{first_artifact_line}') + + remaining_artifact_lines = artifact_lines[1:] + # indent to align with first char in artifact + # to visually separate output keys + remaining_artifact_lines = [ + len(key_chars) * ' ' + l for l in remaining_artifact_lines + ] + output_lines.extend(remaining_artifact_lines) + + # present params + else: + output_lines.append(f'{key_chars}{value}') + + return output_lines diff --git a/sdk/python/kfp/local/logging_utils_test.py b/sdk/python/kfp/local/logging_utils_test.py new file mode 100644 index 00000000000..9438863e16d --- /dev/null +++ b/sdk/python/kfp/local/logging_utils_test.py @@ -0,0 +1,206 @@ +# Copyright 2023 The Kubeflow Authors +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +"""Tests for logging_utils.py.""" + +import io +import unittest +from unittest import mock + +from kfp import dsl +from kfp.local import logging_utils + + +class TestIndentedPrint(unittest.TestCase): + + @mock.patch('sys.stdout', new_callable=io.StringIO) + def test(self, mocked_stdout): + with logging_utils.indented_print(num_spaces=6): + print('foo should be indented') + expected = ' foo should be indented\n' + actual = mocked_stdout.getvalue() + self.assertEqual( + actual, + expected, + ) + + +class TestColorText(unittest.TestCase): + + def test_cyan(self): + + actual = logging_utils.color_text( + 'text to color', + logging_utils.Color.CYAN, + ) + expected = '\x1b[91mtext to color\x1b[0m' + self.assertEqual(actual, expected) + + def test_cyan(self): + + actual = logging_utils.color_text( + 'text to color', + logging_utils.Color.RED, + ) + expected = '\x1b[91mtext to color\x1b[0m' + self.assertEqual(actual, expected) + + +class TestRenderArtifact(unittest.TestCase): + + def test_empty(self): + actual = logging_utils.make_log_lines_for_artifact(dsl.Artifact()) + expected = [ + 'Artifact( name=,', + ' uri=,', + ' metadata={} )', + ] + self.assertListEqual(actual, expected) + + def test_contains_value(self): + actual = logging_utils.make_log_lines_for_artifact( + dsl.Model( + name='my_artifact', + uri='/local/foo/bar', + metadata={ + 'dict_field': { + 'baz': 'bat' + }, + 'float_field': 3.14 + })) + expected = [ + 'Model( name=my_artifact,', + ' uri=/local/foo/bar,', + " metadata={'dict_field': {'baz': 'bat'}, 'float_field': 3.14} )", + ] + self.assertListEqual(actual, expected) + + +class TestMakeLogLinesForOutputs(unittest.TestCase): + + def test_empty(self): + actual = logging_utils.make_log_lines_for_outputs(dict()) + expected = [] + self.assertListEqual(actual, expected) + + def test_only_params(self): + actual = logging_utils.make_log_lines_for_outputs({ + 'foo': 'bar', + 'baz': 100, + 'bat': 1.0, + 'brap': True, + 'my_list': [1, 2, 3], + 'my_dict': { + 'foo': 'bar' + } + }) + expected = [ + ' foo: bar', + ' baz: 100', + ' bat: 1.0', + ' brap: True', + ' my_list: [1, 2, 3]', + " my_dict: {'foo': 'bar'}", + ] + self.assertListEqual(actual, expected) + + def test_only_artifacts(self): + actual = logging_utils.make_log_lines_for_outputs({ + 'my_artifact': + dsl.Artifact(name=''), + 'my_model': + dsl.Model( + name='my_artifact', + uri='/local/foo/bar/1234567890/1234567890/1234567890/1234567890/1234567890', + metadata={ + 'dict_field': { + 'baz': 'bat' + }, + 'float_field': 3.14 + }), + 'my_dataset': + dsl.Dataset( + name='my_dataset', + uri='/local/foo/baz', + metadata={}, + ), + }) + expected = [ + ' my_artifact: Artifact( name=,', + ' uri=,', + ' metadata={} )', + ' my_model: Model( name=my_artifact,', + ' uri=/local/foo/bar/1234567890/1234567890/1234567890/1234567890/1234567890,', + " metadata={'dict_field': {'baz': 'bat'}, 'float_field': 3.14} )", + ' my_dataset: Dataset( name=my_dataset,', + ' uri=/local/foo/baz,', + ' metadata={} )', + ] + self.assertListEqual(actual, expected) + + def test_mix_params_and_artifacts(self): + actual = logging_utils.make_log_lines_for_outputs({ + 'foo': + 'bar', + 'baz': + 100, + 'bat': + 1.0, + 'brap': + True, + 'my_list': [1, 2, 3], + 'my_dict': { + 'foo': 'bar' + }, + 'my_artifact': + dsl.Artifact(name=''), + 'my_model': + dsl.Model( + name='my_artifact', + uri='/local/foo/bar/1234567890/1234567890/1234567890/1234567890/1234567890', + metadata={ + 'dict_field': { + 'baz': 'bat' + }, + 'float_field': 3.14 + }), + 'my_dataset': + dsl.Dataset( + name='my_dataset', + uri='/local/foo/baz', + metadata={}, + ), + }) + expected = [ + ' foo: bar', + ' baz: 100', + ' bat: 1.0', + ' brap: True', + ' my_list: [1, 2, 3]', + " my_dict: {'foo': 'bar'}", + ' my_artifact: Artifact( name=,', + ' uri=,', + ' metadata={} )', + ' my_model: Model( name=my_artifact,', + ' uri=/local/foo/bar/1234567890/1234567890/1234567890/1234567890/1234567890,', + " metadata={'dict_field': {'baz': 'bat'}, 'float_field': 3.14} )", + ' my_dataset: Dataset( name=my_dataset,', + ' uri=/local/foo/baz,', + ' metadata={} )', + ] + + self.assertListEqual(actual, expected) + + +if __name__ == '__main__': + unittest.main() diff --git a/sdk/python/kfp/local/subprocess_task_handler.py b/sdk/python/kfp/local/subprocess_task_handler.py index 5821746420d..b22d70142f7 100644 --- a/sdk/python/kfp/local/subprocess_task_handler.py +++ b/sdk/python/kfp/local/subprocess_task_handler.py @@ -95,8 +95,10 @@ def run_local_subprocess(full_command: List[str]) -> int: with subprocess.Popen( full_command, stdout=subprocess.PIPE, - # no change to behavior in terminal for user, - # but allows more seamless capture/testing of subprocess logs + # No change to behavior in terminal for user, + # but inner process logs redirected to stdout. This separates from + # the outer process logs which, per logging module default, go to + # stderr. stderr=subprocess.STDOUT, text=True, # buffer line-by-line diff --git a/sdk/python/kfp/local/task_dispatcher.py b/sdk/python/kfp/local/task_dispatcher.py index 0e73cdfecf5..4c9f96158ca 100644 --- a/sdk/python/kfp/local/task_dispatcher.py +++ b/sdk/python/kfp/local/task_dispatcher.py @@ -12,12 +12,14 @@ # See the License for the specific language governing permissions and # limitations under the License. """Code for dispatching a local task execution.""" +import logging from typing import Any, Dict from kfp import local from kfp.local import config from kfp.local import executor_input_utils from kfp.local import executor_output_utils +from kfp.local import logging_utils from kfp.local import placeholder_utils from kfp.local import status from kfp.local import subprocess_task_handler @@ -108,33 +110,57 @@ def _run_single_component_implementation( subprocess_task_handler.SubprocessTaskHandler, } TaskHandler = task_handler_map[runner_type] - # TODO: add logging throughout for observability of state, execution progress, outputs, errors, etc. - task_handler = TaskHandler( - image=image, - full_command=full_command, - pipeline_root=pipeline_root, - runner=runner, - ) - task_status = task_handler.run() + with logging_utils.local_logger_context(): + task_name_for_logs = logging_utils.color_text( + f'{task_resource_name!r}', + logging_utils.Color.CYAN, + ) - if task_status == status.Status.SUCCESS: - outputs = executor_output_utils.get_outputs_for_task( - executor_input=executor_input, - component_spec=component_spec, + logging.info(f'Executing task {task_name_for_logs}') + task_handler = TaskHandler( + image=image, + full_command=full_command, + pipeline_root=pipeline_root, + runner=runner, ) - elif task_status == status.Status.FAILURE: - msg = f'Local execution exited with status {task_status.name}.' - if raise_on_error: - raise RuntimeError(msg) - else: - # TODO: replace with robust logging - print(msg) - outputs = {} + # trailing newline helps visually separate subprocess logs + logging.info(f'Streamed logs:\n') + + with logging_utils.indented_print(): + # subprocess logs printed here + task_status = task_handler.run() + + if task_status == status.Status.SUCCESS: + logging.info( + f'Task {task_name_for_logs} finished with status {logging_utils.color_text(task_status.value, logging_utils.Color.GREEN)}' + ) + + outputs = executor_output_utils.get_outputs_for_task( + executor_input=executor_input, + component_spec=component_spec, + ) + if outputs: + output_string = [ + f'Task {task_name_for_logs} outputs:', + *logging_utils.make_log_lines_for_outputs(outputs), + '\n', + ] + logging.info('\n'.join(output_string)) + else: + logging.info(f'Task {task_name_for_logs} has no outputs') + + elif task_status == status.Status.FAILURE: + msg = f'Task {task_name_for_logs} finished with status {logging_utils.color_text(task_status.value, logging_utils.Color.RED)}' + if raise_on_error: + raise RuntimeError(msg) + else: + logging.error(msg) + outputs = {} - else: - # for developers; user should never hit this - raise ValueError(f'Got unknown status: {task_status}') + else: + # for developers; user should never hit this + raise ValueError(f'Got unknown status: {task_status}') - return outputs + return outputs diff --git a/sdk/python/kfp/local/task_dispatcher_test.py b/sdk/python/kfp/local/task_dispatcher_test.py index 753fd7b3dc0..f0bacbe8955 100644 --- a/sdk/python/kfp/local/task_dispatcher_test.py +++ b/sdk/python/kfp/local/task_dispatcher_test.py @@ -19,12 +19,16 @@ irrespective of the runner. While there will inevitably some overlap, we should seek to minimize it. """ +import io import unittest +from unittest import mock from absl.testing import parameterized from kfp import dsl from kfp import local from kfp.dsl import Artifact +from kfp.dsl import Model +from kfp.dsl import Output from kfp.local import testing_utilities ALL_RUNNERS = [ @@ -184,5 +188,99 @@ def identity(x: str) -> str: self.assertEqual(actual, expected) +@parameterized.parameters(ALL_RUNNERS) +class TestExceptionHandlingAndLogging( + testing_utilities.LocalRunnerEnvironmentTestCase): + + @mock.patch('sys.stdout', new_callable=io.StringIO) + def test_user_code_throws_exception_if_raise_on_error( + self, + runner, + mock_stdout, + ): + local.init(runner=runner, raise_on_error=True) + + @dsl.component + def fail_comp(): + raise Exception('String to match on') + + with self.assertRaisesRegex( + RuntimeError, + r"Task \x1b\[96m'fail-comp'\x1b\[0m finished with status \x1b\[91mFAILURE\x1b\[0m", + ): + fail_comp() + + self.assertIn( + 'Exception: String to match on', + mock_stdout.getvalue(), + ) + + @mock.patch('sys.stdout', new_callable=io.StringIO) + @mock.patch('sys.stderr', new_callable=io.StringIO) + def test_user_code_no_exception_if_not_raise_on_error( + self, + runner, + mock_stderr, + mock_stdout, + ): + local.init(runner=runner, raise_on_error=False) + + @dsl.component + def fail_comp(): + raise Exception('String to match on') + + task = fail_comp() + self.assertDictEqual(task.outputs, {}) + + self.assertRegex( + mock_stderr.getvalue(), + r"\d+:\d+:\d+\.\d+ - ERROR - Task \x1b\[96m'fail-comp'\x1b\[0m finished with status \x1b\[91mFAILURE\x1b\[0m", + ) + self.assertIn( + 'Exception: String to match on', + mock_stdout.getvalue(), + ) + + @mock.patch('sys.stdout', new_callable=io.StringIO) + @mock.patch('sys.stderr', new_callable=io.StringIO) + def test_all_logs( + self, + runner, + mock_stderr, + mock_stdout, + ): + local.init(runner=runner) + + @dsl.component + def many_type_component( + num: int, + model: Output[Model], + ) -> str: + print('Inside of my component!') + model.metadata['foo'] = 'bar' + return 'hello' * num + + many_type_component(num=2) + + # outer process logs in stderr + outer_log_regex = ( + r"\d+:\d+:\d+\.\d+ - INFO - Executing task \x1b\[96m'many-type-component'\x1b\[0m\n" + + r'\d+:\d+:\d+\.\d+ - INFO - Streamed logs:\n\n' + + r"\d+:\d+:\d+\.\d+ - INFO - Task \x1b\[96m'many-type-component'\x1b\[0m finished with status \x1b\[92mSUCCESS\x1b\[0m\n" + + + r"\d+:\d+:\d+\.\d+ - INFO - Task \x1b\[96m'many-type-component'\x1b\[0m outputs:\n Output: hellohello\n model: Model\( name=model,\n uri=\./local_outputs/many-type-component-\d+-\d+-\d+-\d+-\d+-\d+-\d+/many-type-component/model,\n metadata={'foo': 'bar'} \)\n\n" + ) + + self.assertRegex( + mock_stderr.getvalue(), + outer_log_regex, + ) + # inner process logs in stdout + self.assertIn('[KFP Executor', mock_stdout.getvalue()) + self.assertIn('Got executor_input:', mock_stdout.getvalue()) + self.assertIn('Inside of my component!', mock_stdout.getvalue()) + self.assertIn('Wrote executor output file to', mock_stdout.getvalue()) + + if __name__ == '__main__': unittest.main()