huggingface · stas00 · Jul 14, 2021 · Jul 14, 2021 · Jul 14, 2021
diff --git a/tests/extended/test_trainer_ext.py b/tests/extended/test_trainer_ext.py
@@ -19,6 +19,7 @@
 import unittest
 from unittest.mock import patch
 
+from parameterized import parameterized
 from transformers.file_utils import is_apex_available
 from transformers.integrations import is_fairscale_available
 from transformers.testing_utils import (
@@ -164,48 +165,30 @@ def test_run_seq2seq_apex(self):
         # to reproduce the problem set distributed=False
         self.run_seq2seq_quick(distributed=True, extra_args_str="--fp16 --fp16_backend=apex")
 
+    @parameterized.expand(["base", "low", "high", "mixed"])
     @require_torch_multi_gpu
-    def test_trainer_log_level_replica(self):
-        log_info_string = "Running training"
-        kwargs = dict(distributed=True, predict_with_generate=False, do_eval=False, do_predict=False)
-
-        # test with the default log_level - should be info and thus log info once
-        with CaptureStderr() as cl:
-            self.run_seq2seq_quick(
-                **kwargs,
-                extra_args_str="",
-            )
-        n_matches = len(re.findall(log_info_string, cl.err))
-        self.assertEqual(n_matches, 1)
-
-        # test with low log_level and log_level_replica - should be noisy on all processes
-        # now the info string should appear twice on 2 processes
-        with CaptureStderr() as cl:
-            self.run_seq2seq_quick(
-                **kwargs,
-                extra_args_str="--log_level debug --log_level_replica debug",
-            )
-        n_matches = len(re.findall(log_info_string, cl.err))
-        self.assertEqual(n_matches, 2)
-
-        # test with high log_level and low log_level_replica
-        # now the info string should appear once only on the replica
-        with CaptureStderr() as cl:
-            self.run_seq2seq_quick(
-                **kwargs,
-                extra_args_str="--log_level error --log_level_replica debug",
-            )
-        n_matches = len(re.findall(log_info_string, cl.err))
-        self.assertEqual(n_matches, 1)
+    def test_trainer_log_level_replica(self, experiment_id):
+        # as each sub-test is slow-ish split into multiple sub-tests to avoid CI timeout
+        experiments = dict(
+            # test with the default log_level - should be info and thus log info once
+            base=dict(extra_args_str="", n_matches=1),
+            # test with low log_level and log_level_replica - should be noisy on all processes
+            # now the info string should appear twice on 2 processes
+            low=dict(extra_args_str="--log_level debug --log_level_replica debug", n_matches=2),
+            # test with high log_level and low log_level_replica
+            # now the info string should appear once only on the replica
+            high=dict(extra_args_str="--log_level error --log_level_replica debug", n_matches=1),
+            # test with high log_level and log_level_replica - should be quiet on all processes
+            mixed=dict(extra_args_str="--log_level error --log_level_replica error", n_matches=0),
+        )
 
-        # test with high log_level and log_level_replica - should be quiet on all processes
+        data = experiments[experiment_id]
+        kwargs = dict(distributed=True, predict_with_generate=False, do_eval=False, do_predict=False)
+        log_info_string = "Running training"
         with CaptureStderr() as cl:
-            self.run_seq2seq_quick(
-                **kwargs,
-                extra_args_str="--log_level error --log_level_replica error",
-            )
+            self.run_seq2seq_quick(**kwargs, extra_args_str=data["extra_args_str"])
         n_matches = len(re.findall(log_info_string, cl.err))
-        self.assertEqual(n_matches, 0)
+        self.assertEqual(n_matches, data["n_matches"])
 
     @slow
     def test_run_seq2seq_slow(self):