avocado: Avoid left-over processes when test reports status

Currently when the test reports status avocado does not check whether the process finished, leaving open space for left-over test processes. This patch unifies the test process handling in case the test reported test status and allows the runner to destroy and report error in case the test process did not finish. Additionally it modifies the error message in case the test was interrupted, because the original message is IMO not clear enough (I spent quite a time analyzing how that happened and if that's an avocado bug or supported result). Signed-off-by: N Lukáš Doktor <ldoktor@redhat.com>

avocado: Avoid left-over processes when test reports status
Currently when the test reports status avocado does not check whether the process finished, leaving open space for left-over test processes. This patch unifies the test process handling in case the test reported test status and allows the runner to destroy and report error in case the test process did not finish. Additionally it modifies the error message in case the test was interrupted, because the original message is IMO not clear enough (I spent quite a time analyzing how that happened and if that's an avocado bug or supported result). Signed-off-by: N Lukáš Doktor <ldoktor@redhat.com>
d86e5912 · Lukáš Doktor · f1c6d8f5 · d86e5912 · d86e5912
隐藏空白更改
内联并排

Showing with 95 addition and 26 deletion

avocado/core/runner.py avocado/core/runner.py +37 -25

selftests/functional/test_basic.py selftests/functional/test_basic.py +58 -1

未找到文件。
--- a/avocado/core/runner.py
+++ b/avocado/core/runner.py
@@ -149,33 +149,48 @@ class TestStatus(object):
            else:       # test_status
                self.status = msg
-    def abort(self, proc, started, timeout, first, step):
+    def finish(self, proc, started, timeout, step):
        """
-        Handle job abortion
+        Wait for the test process to finish and report status or error status
+        if unable to obtain the status till deadline.
        :param proc: The test's process
        :param started: Time when the test started
        :param timeout: Timeout for waiting on status
        :param first: Delay before first check
        :param step: Step between checks for the status
        """
-        if proc.is_alive() and wait.wait_for(lambda: self.status, timeout,
+        # Wait for either process termination or test status
-                                             first, step):
+        wait.wait_for(lambda: not proc.is_alive() or self.status, timeout, 0,
-            status = self.status
+                      step)
-        else:
+        if self.status:     # status exists, wait for process to finish
-            test_state = self.early_status
+            if not wait.wait_for(lambda: not proc.is_alive(), timeout, 0,
-            test_state['time_elapsed'] = time.time() - started
+                                 step):
-            test_state['fail_reason'] = 'Test process aborted'
+                err = "Test reported status but did not finish"
-            test_state['status'] = exceptions.TestAbortError.status
+            else:   # Test finished and reported status, pass
-            test_state['fail_class'] = (exceptions.TestAbortError.__class__.
+                return self.status
-                                        __name__)
+        else:   # proc finished, wait for late status delivery
-            test_state['traceback'] = 'Traceback not available'
+            if not wait.wait_for(lambda: self.status, timeout, 0, step):
-            with open(test_state['logfile'], 'r') as log_file_obj:
+                err = "Test died without reporting the status."
-                test_state['text_output'] = log_file_obj.read()
+            else:
-            TEST_LOG.error('ERROR %s -> TestAbortedError: '
+                # Status delivered after the test process finished, pass
-                           'Test aborted unexpectedly',
+                return self.status
-                           test_state['name'])
+        # At this point there were failures, fill the new test status
-            status = test_state
+        TEST_LOG.debug("Original status: %s", str(self.status))
+        test_state = self.early_status
+        test_state['time_elapsed'] = time.time() - started
+        test_state['fail_reason'] = err
+        test_state['status'] = exceptions.TestAbortError.status
+        test_state['fail_class'] = (exceptions.TestAbortError.__class__.
+                                    __name__)
+        test_state['traceback'] = 'Traceback not available'
+        with open(test_state['logfile'], 'r') as log_file_obj:
+            test_state['text_output'] = log_file_obj.read()
+        TEST_LOG.error('ERROR %s -> TestAbortedError: '
+                       'Test process died without reporting the status.',
+                       test_state['name'])
        if proc.is_alive():
+            TEST_LOG.warning("Killing hanged test process %s" % proc.pid)
            for _ in xrange(5):     # I really want to destroy it
                os.kill(proc.pid, signal.SIGKILL)
                if not proc.is_alive():
@@ -184,7 +199,7 @@ class TestStatus(object):
            else:
                raise exceptions.TestError("Unable to destroy test's process "
                                           "(%s)" % proc.pid)
-        return status
+        return test_state
 class TestRunner(object):
@@ -370,11 +385,8 @@ class TestRunner(object):
                    os.kill(proc.pid, signal.SIGKILL)
        # Get/update the test status
-        if test_status.status:
+        test_state = test_status.finish(proc, time_started, cycle_timeout,
-            test_state = test_status.status
+                                        step)
-        else:
-            test_state = test_status.abort(proc, time_started, cycle_timeout,
-                                           first, step)
        # Try to log the timeout reason to test's results and update test_state
        if abort_reason:

--- a/selftests/functional/test_basic.py
+++ b/selftests/functional/test_basic.py
@@ -75,6 +75,27 @@ class MyTest(Test):
 '''
+REPORTS_STATUS_AND_HANG = '''
+from avocado import Test
+import time
+class MyTest(Test):
+    def test(self):
+         self.runner_queue.put({"running": False})
+         time.sleep(60)
+'''
+DIE_WITHOUT_REPORTING_STATUS = '''
+from avocado import Test
+import os
+import signal
+class MyTest(Test):
+    def test(self):
+         os.kill(os.getpid(), signal.SIGKILL)
+'''
 class RunnerOperationTest(unittest.TestCase):
    def setUp(self):
@@ -183,6 +204,42 @@ class RunnerOperationTest(unittest.TestCase):
            self.assertIn("Original fail_reason: None",
                          results["tests"][0]["fail_reason"])
+    def test_hanged_test_with_status(self):
+        """ Check that avocado handles hanged tests properly """
+        os.chdir(basedir)
+        with script.TemporaryScript("report_status_and_hang.py",
+                                    REPORTS_STATUS_AND_HANG,
+                                    "hanged_test_with_status") as tst:
+            res = process.run("./scripts/avocado run --sysinfo=off "
+                              "--job-results-dir %s %s --json -"
+                              % (self.tmpdir, tst), ignore_status=True)
+            self.assertEqual(res.exit_status, exit_codes.AVOCADO_TESTS_FAIL)
+            results = json.loads(res.stdout)
+            self.assertEqual(results["tests"][0]["status"], "ERROR",
+                             "%s != %s\n%s" % (results["tests"][0]["status"],
+                                               "ERROR", res))
+            self.assertIn("Test reported status but did not finish",
+                          results["tests"][0]["fail_reason"])
+            self.assertLess(res.duration, 40, "Test execution took too long, "
+                            "which is likely because the hanged test was not "
+                            "interrupted. Results:\n%s" % res)
+    def test_no_status_reported(self):
+        os.chdir(basedir)
+        with script.TemporaryScript("die_without_reporting_status.py",
+                                    DIE_WITHOUT_REPORTING_STATUS,
+                                    "no_status_reported") as tst:
+            res = process.run("./scripts/avocado run --sysinfo=off "
+                              "--job-results-dir %s %s --json -"
+                              % (self.tmpdir, tst), ignore_status=True)
+            self.assertEqual(res.exit_status, exit_codes.AVOCADO_TESTS_FAIL)
+            results = json.loads(res.stdout)
+            self.assertEqual(results["tests"][0]["status"], "ERROR",
+                             "%s != %s\n%s" % (results["tests"][0]["status"],
+                                               "ERROR", res))
+            self.assertIn("Test died without reporting the status",
+                          results["tests"][0]["fail_reason"])
    def test_runner_tests_fail(self):
        os.chdir(basedir)
        cmd_line = ('./scripts/avocado run --sysinfo=off --job-results-dir %s '
@@ -267,7 +324,7 @@ class RunnerOperationTest(unittest.TestCase):
                    '--xunit - abort.py' % self.tmpdir)
        result = process.run(cmd_line, ignore_status=True)
        output = result.stdout
-        excerpt = 'Test process aborted'
+        excerpt = 'Test died without reporting the status.'
        expected_rc = exit_codes.AVOCADO_TESTS_FAIL
        unexpected_rc = exit_codes.AVOCADO_FAIL
        self.assertNotEqual(result.exit_status, unexpected_rc,