From df40b8cce21b51cd6a18e614ff943300a1b7f55d Mon Sep 17 00:00:00 2001
From: Alexander Grund
Date: Thu, 22 Jan 2026 12:44:50 +0100
Subject: [PATCH] Add option to allow missing or additional detected PyTorch
 test suites

---
 easybuild/easyblocks/p/pytorch.py | 125 +++++++++++++++++++-----------
 1 file changed, 82 insertions(+), 43 deletions(-)

diff --git a/easybuild/easyblocks/p/pytorch.py b/easybuild/easyblocks/p/pytorch.py
index 8a73b611c5e..894bd2e2d10 100755
--- a/easybuild/easyblocks/p/pytorch.py
+++ b/easybuild/easyblocks/p/pytorch.py
@@ -259,10 +259,20 @@ def extra_options():
     extra_vars.update({
         'build_type': [None, "Build type for CMake, e.g. Release."
                              "Defaults to 'Release' or 'Debug' depending on toolchainopts[debug]", CUSTOM],
-        'custom_opts': [[], "List of options for the build/install command. Can be used to change the defaults " +
+        'custom_opts': [[], "List of options for the build/install command. Can be used to change the defaults "
                             "set by the PyTorch EasyBlock, for example ['USE_MKLDNN=0'].", CUSTOM],
         'excluded_tests': [{}, "Mapping of architecture strings to list of tests to be excluded", CUSTOM],
         'max_failed_tests': [10, "Maximum number of failing tests", CUSTOM],
+        # Relax checking of failed test suites (files)
+        'allow_extra_failures': [True, "Do not fail if more failing test suites are found in the XML files than are"
+                                       " shown in the stdout of the test command. This can overestimate the number"
+                                       " of failed tests. Can be set to the maximum number of allowed extra failures.",
+                                 CUSTOM],
+        'allow_missing_failures': [False, "Do not fail if a failing test suite/file, as shown in the stdout of the"
+                                          " test command, is not found in the XML files."
+                                          " As this also happens when tests fail to start at all,"
+                                          " it can miss a large number of failed tests."
+                                          " Can be set to the maximum number of allowed missing failures.", CUSTOM],
     })
 
     # disable use of pip to install PyTorch by default, overwriting the default set in PythonPackage;
@@ -703,17 +713,30 @@ def suite_is_in_xml_results(suite_name):
 
         # Create clear summary report
         # Use a list of messages we can later join together
-        failure_msgs = ['\t%s (%s)' % (suite.name, suite.summary) for suite in parsed_test_result.failed_suites]
-        # These were accounted for
-        failed_test_suites = {suite.name for suite in parsed_test_result.failed_suites}
-        # Those are all that failed according to the summary output
-        all_failed_test_suites = parsed_test_result.all_failed_suites
-        # We should have determined all failed test suites and only those.
-        # Otherwise show the mismatch and terminate later
-        if failed_test_suites != all_failed_test_suites:
-            failure_msgs.insert(0, 'Failed tests (suites/files):')
-            # Test suites where we didn't match a specific regexp and hence likely didn't count the failures
-            uncounted_test_suites = all_failed_test_suites - failed_test_suites
+        failure_msgs = []
+        # Calculate total number of unsuccessful and total tests
+        failed_test_cnt = parsed_test_result.failure_cnt + parsed_test_result.error_cnt
+        # Only add count message if we detected any failed tests
+        if failed_test_cnt > 0:
+            failure_or_failures = 'failure' if parsed_test_result.failure_cnt == 1 else 'failures'
+            error_or_errors = 'error' if parsed_test_result.error_cnt == 1 else 'errors'
+            failure_msgs.append(f"{parsed_test_result.failure_cnt} test {failure_or_failures}, "
+                                f"{parsed_test_result.error_cnt} test {error_or_errors} "
+                                f"(out of {parsed_test_result.test_cnt}):")
+        if parsed_test_result.failed_suites:
+            failure_msgs.append('Failed tests (suites/files):')
+            failure_msgs.extend('\t%s (%s)' % (suite.name, suite.summary) for suite in parsed_test_result.failed_suites)
+
+        # At the end of the stdout of the test command there is a summary of failed suites.
+        # We should have determined all of those test suites and only those.
+        # These were accounted for:
+        failed_suites_parsed = {suite.name for suite in parsed_test_result.failed_suites}
+        # From the summary:
+        failed_suites_from_summary = parsed_test_result.all_failed_suites
+        # Add all mismatches to the summary
+        if failed_suites_parsed != failed_suites_from_summary:
+            # Test suites we missed when parsing and hence (likely) didn't count the failures:
+            uncounted_test_suites = failed_suites_from_summary - failed_suites_parsed
             if uncounted_test_suites:
                 failure_msgs.append('Could not count failed tests for the following test suites/files:')
                 for suite_name in sorted(uncounted_test_suites):
@@ -725,46 +748,62 @@ def suite_is_in_xml_results(suite_name):
                         reason = 'Undetected or did not run properly'
                     failure_msgs.append(f'\t{suite_name} ({reason})')
             # Test suites not included in the catch-all regexp but counted. Should be empty.
-            unexpected_test_suites = failed_test_suites - all_failed_test_suites
+            unexpected_test_suites = failed_suites_parsed - failed_suites_from_summary
             if unexpected_test_suites:
                 failure_msgs.append('Counted failures of tests from the following test suites/files that are not '
                                     'contained in the summary output of PyTorch:')
                 failure_msgs.extend(sorted(unexpected_test_suites))
 
-        # Calculate total number of unsuccesful and total tests
-        failed_test_cnt = parsed_test_result.failure_cnt + parsed_test_result.error_cnt
-        # Only add count message if we detected any failed tests
-        if failed_test_cnt > 0:
-            failure_or_failures = 'failure' if parsed_test_result.failure_cnt == 1 else 'failures'
-            error_or_errors = 'error' if parsed_test_result.error_cnt == 1 else 'errors'
-            failure_msgs.insert(0, "%d test %s, %d test %s (out of %d):" % (
-                parsed_test_result.failure_cnt, failure_or_failures,
-                parsed_test_result.error_cnt, error_or_errors,
-                parsed_test_result.test_cnt
-            ))
-
         # Assemble final report
         failure_report = '\n'.join(failure_msgs)
 
-        if failed_test_suites != all_failed_test_suites:
-            # Fail because we can't be sure how many tests failed
-            # so comparing to max_failed_tests cannot reasonably be done
-            if failed_test_suites | set(parsed_test_result.terminated_suites) == all_failed_test_suites:
-                # All failed test suites are either counted or terminated with a signal
-                msg = ('Failing because these test suites were terminated which makes it impossible '
-                       'to accurately count the failed tests: ')
-                msg += ", ".join("%s(%s)" % name_signal
-                                 for name_signal in sorted(parsed_test_result.terminated_suites.items()))
-            elif len(failed_test_suites) < len(all_failed_test_suites):
-                msg = ('Failing because not all failed tests could be determined. Tests failed to start, crashed '
-                       'or the test accounting in the PyTorch EasyBlock needs updating!\n'
-                       'Missing: ' + ', '.join(sorted(all_failed_test_suites - failed_test_suites)))
+        # On mismatch, failed_test_cnt may be wrong.
+        # Fail (including the full report) or warn before comparing to max_failed_tests.
+        if failed_suites_parsed != failed_suites_from_summary:
+            def to_num(bool_or_int):
+                # True means "unlimited", False maps to 0, integers are used as-is
+                return float('inf') if bool_or_int is True else int(bool_or_int)
+            num_allowed_extra_failures = to_num(self.cfg['allow_extra_failures'])
+            num_allowed_missing_failures = to_num(self.cfg['allow_missing_failures'])
+            missing_suites = failed_suites_from_summary - failed_suites_parsed
+            extra_suites = failed_suites_parsed - failed_suites_from_summary
+
+            if missing_suites:
+                if missing_suites == set(parsed_test_result.terminated_suites):
+                    # All failed test suites are either counted or terminated with a signal
+                    if len(missing_suites) <= num_allowed_missing_failures:
+                        msg = f'These {len(missing_suites)} test suites were terminated,'
+                    else:
+                        msg = f'Failing because these {len(missing_suites)} test suites were terminated,'
+                    msg += ' which makes it impossible to accurately count the failed tests: '
+                    msg += ", ".join("%s(%s)" % name_signal
+                                     for name_signal in sorted(parsed_test_result.terminated_suites.items()))
+                else:
+                    if len(missing_suites) <= num_allowed_missing_failures:
+                        msg = 'Not all failed tests could be determined.'
+                    else:
+                        msg = 'Failing because not all failed tests could be determined.'
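+                    # Either way, name the likely causes and list the suites whose failures we could not count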
+                    msg += (' Tests failed to start, crashed, or the test accounting in the '
+                            'PyTorch EasyBlock needs updating!\n'
+                            f'Missing ({len(missing_suites)}): ' + ', '.join(sorted(missing_suites)))
             else:
-                msg = ('Failing because there were unexpected failures detected: ' +
-                       ', '.join(sorted(failed_test_suites - all_failed_test_suites)))
-            raise EasyBuildError(msg + '\n' +
-                                 'You can check the test failures (in the log) manually and if they are harmless, '
-                                 'use --ignore-test-failure to make the test step pass.\n' + failure_report)
+                msg = ''
+            if extra_suites:
+                if msg:
+                    msg += '\n'  # There can be missing AND extra suites
+
+                if len(extra_suites) <= num_allowed_extra_failures:
+                    msg += f'{len(extra_suites)} unexpected failures detected: '
+                else:
+                    msg += f'Failing because {len(extra_suites)} unexpected failures were detected: '
+                msg += ', '.join(sorted(extra_suites))
+            if len(missing_suites) > num_allowed_missing_failures or len(extra_suites) > num_allowed_extra_failures:
+                raise EasyBuildError(msg + '\n' +
+                                     'You can check the test failures (in the log) manually and if they are harmless, '
+                                     'use --ignore-test-failure to make the test step pass.\n' + failure_report)
+            print_warning(msg, log=self.log)
 
         if failed_test_cnt > 0:
             max_failed_tests = self.cfg['max_failed_tests']
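+            # failed_test_cnt is compared against this limit below to decide whether to fail or only warn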