enh: Add script to map tests <-> jenkins stages & vice-versa (#5177)

venkywonka · chzblych · web-flow · commit 22d4a8c48a3f · 2025-07-19T00:50:40.000+08:00
Signed-off-by: Venky Ganesh <23023424+venkywonka@users.noreply.github.com>
Signed-off-by: Yanchao Lu <yanchaol@nvidia.com>
Co-authored-by: Yanchao Lu <yanchaol@nvidia.com>
diff --git a/.github/pull_request_template.md b/.github/pull_request_template.md
@@ -70,7 +70,8 @@ Launch build/test pipelines. All previously running jobs will be killed.
 
 `--debug ` *(OPTIONAL)* : **Experimental feature**. Enable access to the CI container for debugging purpose. Note: Specify exactly one stage in the `stage-list` parameter to access the appropriate container environment. Note: Does **NOT** update GitHub check status.
 
-For guidance on mapping tests to stage names, see `docs/source/reference/ci-overview.md`.
+For guidance on mapping tests to stage names, see `docs/source/reference/ci-overview.md`
+and the `scripts/test_to_stage_mapping.py` helper.
 
 ### kill
 
diff --git a/docs/source/reference/ci-overview.md b/docs/source/reference/ci-overview.md
@@ -55,9 +55,27 @@ The array elements are: GPU type, YAML file (without extension), shard index, an
 2. Search `jenkins/L0_Test.groovy` for a stage whose YAML file matches (for example `l0_a100`) and whose name contains `[Post-Merge]` if the YAML entry uses `stage: post_merge`.
 3. The resulting stage name(s) are what you pass to Jenkins via the `stage_list` parameter when triggering a job.
 
-### Example
+### Using `test_to_stage_mapping.py`
+
+Manually searching YAML and Groovy files can be tedious.  The helper script
+`scripts/test_to_stage_mapping.py` automates the lookup:
+
+```bash
+python scripts/test_to_stage_mapping.py --tests "triton_server/test_triton.py::test_gpt_ib_ptuning[gpt-ib-ptuning]"
+python scripts/test_to_stage_mapping.py --tests gpt_ib_ptuning
+python scripts/test_to_stage_mapping.py --stages A100X-Triton-Post-Merge-1
+python scripts/test_to_stage_mapping.py --test-list my_tests.txt
+python scripts/test_to_stage_mapping.py --test-list my_tests.yml
+```
+
+The first two commands print the Jenkins stages that run the specified tests or
+patterns. Patterns are matched by substring, so partial test names are
+supported out of the box. The third lists every test executed in the given
+stage. When providing tests on the command line, quote each test string so the
+shell does not interpret the `[` and `]` characters as globs. Alternatively,
+store the tests in a newline-separated text file or a YAML list and supply it
+with `--test-list`, as the last two commands do.
 
-`triton_server/test_triton.py::test_gpt_ib_ptuning[gpt-ib-ptuning]` appears in `l0_a100.yml` under `stage: post_merge` and `backend: triton`.  The corresponding Jenkins stages are `A100X-Triton-[Post-Merge]-1` and `A100X-Triton-[Post-Merge]-2` (two shards).
 
 To run the same tests on your pull request, comment:
 
@@ -67,6 +85,7 @@ To run the same tests on your pull request, comment:
 
 This executes the same tests that run post-merge for this hardware/backend.
 
+
 ## Waiving tests
 
 Sometimes a test is known to fail due to a bug or unsupported feature. Instead
diff --git a/jenkins/L0_Test.groovy b/jenkins/L0_Test.groovy
@@ -1710,6 +1710,24 @@ def runInKubernetes(pipeline, podSpec, containerName)
 def launchTestJobs(pipeline, testFilter, dockerNode=null)
 {
     def dockerArgs = "-v /mnt/scratch.trt_llm_data:/scratch.trt_llm_data:ro -v /tmp/ccache:${CCACHE_DIR}:rw -v /tmp/pipcache/http-v2:/root/.cache/pip/http-v2:rw --cap-add syslog"
+
+    // IMPORTANT: Stage Configuration Syntax Requirement
+    //
+    // The test_to_stage_mapping.py script expects stage definitions in the following format:
+    // "Stage-Name": ["platform", "yaml_file", split_id, split_count, gpu_count]
+    //
+    // Where:
+    // - Stage-Name: Double-quoted string on the same line as its array; identifies the Jenkins stage
+    // - platform: Hardware platform identifier (e.g., "a10", "h100-cr")
+    // - yaml_file: Test database YAML filename without .yml extension (e.g., "l0_a10")
+    // - split_id: Current split number (1-based)
+    // - split_count: Total number of splits
+    // - gpu_count: Number of GPUs required (optional, defaults to 1)
+    //
+    // This format is parsed by scripts/test_to_stage_mapping.py to provide bidirectional
+    // mapping between test names and Jenkins stage names. Any changes to this syntax
+    // may break the mapping functionality.
+
     x86TestConfigs = [
         "DGX_H100-4_GPUs-PyTorch-DeepSeek-1": ["dgx-h100-x4", "l0_dgx_h100", 1, 2, 4],
         "DGX_H100-4_GPUs-PyTorch-DeepSeek-2": ["dgx-h100-x4", "l0_dgx_h100", 2, 2, 4],
diff --git a/scripts/dco_check.py b/scripts/dco_check.py
@@ -22,7 +22,7 @@ def commit_message_has_signoff(message):
 
 def main():
     if len(sys.argv) != 2:
-        print("Usage: python commit-msg.py <commit message filename>")
+        print("Usage: python dco_check.py <commit message filename>")
         sys.exit(1)
 
     # Read the commit message from the file passed as an argument by Git
diff --git a/scripts/test_to_stage_mapping.py b/scripts/test_to_stage_mapping.py
@@ -0,0 +1,266 @@
+"""Lookup Jenkins stage names for integration tests and vice versa.
+
+This helper parses ``jenkins/L0_Test.groovy`` and the YAML files under
+``tests/integration/test_lists/test-db`` to provide a bidirectional mapping
+between test names and Jenkins stage names. When ``--tests`` or ``--test-list``
+options are used, each value is split on whitespace and every resulting
+fragment must occur, case-insensitively, as a substring of the fully
+qualified test name. An exact test name therefore matches itself as well.
+
+Example usage::
+
+   python scripts/test_to_stage_mapping.py --tests \\
+       "triton_server/test_triton.py::test_gpt_ib_ptuning[gpt-ib-ptuning]"
+   python scripts/test_to_stage_mapping.py --tests gpt_ib_ptuning
+   python scripts/test_to_stage_mapping.py --stages \\
+       A100X-Triton-Post-Merge-1
+
+Tests can also be provided via ``--test-list`` pointing to either a plain text
+file or a YAML list file. Quote individual test names on the command line so
+the shell does not interpret ``[`` and ``]`` characters.
+"""
+
+import argparse
+import os
+import re
+from collections import defaultdict
+from glob import glob
+from typing import List
+
+import yaml
+
+
+def _load_tests_file(path: str) -> List[str]:
+    """Read test name patterns from a plain-text or YAML list file.
+
+    Blank lines and lines starting with ``#`` are skipped. For ``.yml`` /
+    ``.yaml`` paths only ``- item`` lines are collected (the file is scanned
+    line by line, it is not parsed as YAML); for any other path every
+    remaining line is one pattern.
+
+    Args:
+        path: File to read.
+
+    Returns:
+        The non-empty patterns in file order.
+    """
+    yaml_mode = path.endswith(('.yml', '.yaml'))
+    tests: List[str] = []
+    with open(path, 'r', encoding='utf-8') as f:
+        for line in f:
+            line = line.strip()
+            if not line or line.startswith('#'):
+                continue
+            if yaml_mode:
+                if not line.startswith('- '):
+                    continue
+                line = line[2:].strip()
+                # Names containing ``[``/``]`` are commonly quoted in YAML;
+                # drop one pair of matching quotes so the pattern can match.
+                quoted = len(line) >= 2 and line[0] == line[-1]
+                if quoted and line[0] in ('"', "'"):
+                    line = line[1:-1]
+                if not line:
+                    continue
+            tests.append(line)
+    return tests
+
+
+# Regex to parse Jenkins stage configurations from Groovy files.
+# It is searched against one line at a time, so an entry must fit on one line:
+#   "Stage-Name": ["platform", "yaml_file", split_id, split_count, gpu_count]
+#
+# Pattern breakdown:
+#   "(?P<stage>[^"]+)"  - Captures stage name in double quotes (group 'stage')
+#   \s*:\s*             - Matches colon with optional whitespace
+#   \["[^"]+"           - Matches opening bracket directly followed by the quoted platform (ignored)
+#   ,\s*                - Matches comma with optional whitespace
+#   "(?P<yml>[^"]+)"    - Captures yaml filename in double quotes (group 'yml')
+#   (?:,\s*\d+)*        - Matches zero or more comma-separated numbers (split_id, split_count, gpu_count)
+#   \s*\]               - Matches closing bracket with optional whitespace
+_STAGE_RE = re.compile(
+    r'"(?P<stage>[^"]+)"\s*:\s*\["[^"]+",\s*"(?P<yml>[^"]+)"(?:,\s*\d+)*\s*\]')
+
+
+def _extract_terms(entry):
+    """Return the ``terms`` mapping of a test-db entry.
+
+    ``entry['terms']`` is used when present and non-empty; otherwise the
+    lookup falls back to ``entry['condition']['terms']``. Keys that exist but
+    are null (for example a bare ``condition:`` line in YAML) are treated
+    like missing keys, so callers can always call ``.get`` on the result.
+
+    Args:
+        entry: One parsed entry (a mapping) from a test-db YAML file.
+
+    Returns:
+        The terms mapping, or an empty dict when none is defined.
+    """
+    terms = entry.get('terms')
+    if not terms:
+        condition = entry.get('condition') or {}
+        terms = condition.get('terms')
+    return terms or {}
+
+
+class StageQuery:
+    """Bidirectional lookup between integration tests and Jenkins stages.
+
+    The lookup tables are built once in ``__init__`` from the Groovy stage
+    table and the test-db YAML files:
+
+    * ``stage_to_yaml``: stage name -> YAML file name (``<name>.yml``).
+    * ``yaml_to_stages``: YAML file name -> list of stage names.
+    * ``test_map``: test name -> list of ``(yaml, stage_type, backend)``.
+    * ``yaml_stage_tests``: YAML file name -> stage_type -> list of tests.
+    """
+
+    def __init__(self, groovy_path: str, test_db_dir: str):
+        """Build the lookup tables.
+
+        Args:
+            groovy_path: Path to the Groovy file holding the stage table.
+            test_db_dir: Directory containing the test-db YAML files.
+        """
+        self.stage_to_yaml, self.yaml_to_stages = self._parse_stage_mapping(
+            groovy_path)
+        self.test_map, self.yaml_stage_tests = self._parse_tests(test_db_dir)
+        # Build dynamic backend mapping from discovered data
+        self._backend_keywords = self._discover_backend_keywords()
+
+    @staticmethod
+    def _normalize_backend(backend):
+        """Return *backend* stripped and lower-cased ('' if null/non-str)."""
+        return backend.strip().lower() if isinstance(backend, str) else ''
+
+    @staticmethod
+    def _as_keyword_list(keywords):
+        """Return *keywords* as a list; a bare string becomes one element."""
+        return [keywords] if isinstance(keywords, str) else list(keywords)
+
+    @staticmethod
+    def _parse_stage_mapping(path):
+        """Scan the Groovy file line by line for stage definitions.
+
+        Returns:
+            ``(stage_to_yaml, yaml_to_stages)``; YAML names carry ``.yml``.
+        """
+        stage_to_yaml = {}
+        yaml_to_stages = defaultdict(list)
+        with open(path, 'r') as f:
+            for line in f:
+                m = _STAGE_RE.search(line)
+                if m:
+                    stage = m.group('stage')
+                    yml = m.group('yml') + '.yml'
+                    stage_to_yaml[stage] = yml
+                    yaml_to_stages[yml].append(stage)
+        return stage_to_yaml, yaml_to_stages
+
+    def _parse_tests(self, db_dir):
+        """Parse tests from YAML files, supporting both .yml and .yaml.
+
+        Entries without a ``stage`` term are ignored. Empty documents and
+        entries with a null ``tests`` list are skipped instead of raising.
+
+        Returns:
+            ``(test_map, yaml_stage_tests)`` as described on the class.
+        """
+        test_map = defaultdict(list)
+        yaml_stage_tests = defaultdict(lambda: defaultdict(list))
+
+        # sorted() keeps the insertion order of both maps reproducible.
+        yaml_files = sorted(
+            glob(os.path.join(db_dir, '*.yml')) +
+            glob(os.path.join(db_dir, '*.yaml')))
+
+        for path in yaml_files:
+            with open(path, 'r') as f:
+                data = yaml.safe_load(f)
+            if not isinstance(data, dict):
+                # Empty file or non-mapping document: nothing to index.
+                continue
+            # Stage definitions are always recorded as '<name>.yml', so a
+            # '.yaml' file has to be indexed under that spelling as well.
+            yml = os.path.splitext(os.path.basename(path))[0] + '.yml'
+            for key, entries in data.items():
+                if key == 'version' or entries is None:
+                    continue
+                for entry in entries:
+                    terms = _extract_terms(entry)
+
+                    stage = terms.get('stage')
+                    if stage is None:
+                        continue
+
+                    backend = terms.get('backend') or ''  # Default to empty
+
+                    for t in entry.get('tests') or []:
+                        test_map[t].append((yml, stage, backend))
+                        yaml_stage_tests[yml][stage].append(t)
+        return test_map, yaml_stage_tests
+
+    def _discover_backend_keywords(self):
+        """Discover backend keywords from existing data dynamically.
+
+        Returns:
+            Dict mapping each normalized backend found in ``test_map`` to
+            the list of upper-case keywords looked for in stage names.
+            Keys are inserted in sorted order so lookups are deterministic.
+        """
+        all_backends = set()
+        for mappings in self.test_map.values():
+            for _yml, _stage_type, backend in mappings:
+                normalized = self._normalize_backend(backend)
+                if normalized:
+                    all_backends.add(normalized)
+
+        # Common variations/aliases; other backends use their own name.
+        aliases = {
+            'tensorrt': ['TENSORRT', 'TRT'],
+            'pytorch': ['PYTORCH', 'TORCH'],
+            'cpp': ['CPP', 'C++'],
+            'triton': ['TRITON']
+        }
+
+        return {
+            backend: aliases.get(backend, [backend.upper()])
+            for backend in sorted(all_backends)
+        }
+
+    def search_tests(self, pattern: str):
+        """Return the known tests matching *pattern*.
+
+        The pattern is split on whitespace; a test matches when every
+        fragment occurs in its name, ignoring case. A blank pattern matches
+        nothing (``all()`` over no fragments would otherwise select every
+        test).
+        """
+        parts = [p.lower() for p in pattern.split()]
+        if not parts:
+            return []
+        result = []
+        for test in self.test_map:
+            name = test.lower()
+            if all(p in name for p in parts):
+                result.append(test)
+        return result
+
+    def tests_to_stages(self, tests):
+        """Return the sorted stage names that run any of *tests*.
+
+        A stage qualifies when it uses the test's YAML file, its name agrees
+        with the pre/post-merge stage type, and, if the test declares a
+        backend, its name contains one of that backend's keywords.
+        """
+        result = set()
+        for t in tests:
+            for yml, stage_type, backend in self.test_map.get(t, []):
+                backend = self._normalize_backend(backend)
+                keywords = self._as_keyword_list(
+                    self._backend_keywords.get(backend, [backend.upper()]))
+                for s in self.yaml_to_stages.get(yml, []):
+                    is_post_merge = 'Post-Merge' in s
+                    if stage_type == 'post_merge' and not is_post_merge:
+                        continue
+                    if stage_type == 'pre_merge' and is_post_merge:
+                        continue
+
+                    # Filter by backend if specified
+                    if backend and not any(keyword in s.upper()
+                                           for keyword in keywords):
+                        continue
+
+                    result.add(s)
+        return sorted(result)
+
+    def stages_to_tests(self, stages):
+        """Return the sorted test names executed by any of *stages*.
+
+        Unknown stage names are ignored. The stage type is ``post_merge``
+        when the name contains ``Post-Merge`` and ``pre_merge`` otherwise.
+        """
+        result = set()
+        for s in stages:
+            yml = self.stage_to_yaml.get(s)
+            if not yml:
+                continue
+            stage_type = 'post_merge' if 'Post-Merge' in s else 'pre_merge'
+
+            # Determine expected backend dynamically from stage name
+            expected_backend = None
+            stage_upper = s.upper()
+            for backend, keywords in self._backend_keywords.items():
+                if any(keyword in stage_upper
+                       for keyword in self._as_keyword_list(keywords)):
+                    expected_backend = backend
+                    break
+
+            # Get all tests for yml/stage_type, then filter by backend
+            all_tests = self.yaml_stage_tests.get(yml, {}).get(stage_type, [])
+            for test in all_tests:
+                for test_yml, test_stage, test_backend in self.test_map.get(
+                        test, []):
+                    if test_yml != yml or test_stage != stage_type:
+                        continue
+                    # Compare normalized names: the keyword table is keyed by
+                    # stripped, lower-cased backends.
+                    # NOTE(review): tests without a backend term are excluded
+                    # here once a stage backend is detected, although
+                    # tests_to_stages() maps them to every stage - confirm.
+                    if (expected_backend is None
+                            or self._normalize_backend(test_backend)
+                            == expected_backend):
+                        result.add(test)
+                        break
+        return sorted(result)
+
+
+def main():
+    """Parse command-line arguments and print the requested mapping.
+
+    Exactly one of ``--tests``, ``--test-list`` or ``--stages`` is required.
+    With test patterns, the matching Jenkins stage names are printed one per
+    line; with ``--stages``, the test names run by those stages are printed
+    one per line.
+    """
+    parser = argparse.ArgumentParser(
+        description='Map Jenkins stages to tests and vice versa.')
+    group = parser.add_mutually_exclusive_group(required=True)
+    group.add_argument(
+        '--tests',
+        nargs='+',
+        help='One or more test name patterns to resolve to Jenkins stages')
+    group.add_argument(
+        '--test-list',
+        help=('File with test name patterns, either newline separated '
+              'or a YAML list'))
+    group.add_argument('--stages',
+                       nargs='+',
+                       help='List of stage names to look up')
+    parser.add_argument(
+        '--repo-root',
+        # abspath() keeps the default valid when __file__ is a bare or
+        # relative name (e.g. the script is started from inside scripts/).
+        default=os.path.dirname(os.path.dirname(os.path.abspath(__file__))),
+        help='Path to repository root')
+    args = parser.parse_args()
+
+    groovy = os.path.join(args.repo_root, 'jenkins', 'L0_Test.groovy')
+    db_dir = os.path.join(args.repo_root, 'tests', 'integration', 'test_lists',
+                          'test-db')
+    query = StageQuery(groovy, db_dir)
+
+    if args.tests or args.test_list:
+        # The options are mutually exclusive, so only one source is set.
+        if args.tests:
+            patterns = list(args.tests)
+        else:
+            patterns = _load_tests_file(args.test_list)
+
+        collected = set()
+        for pat in patterns:
+            collected.update(query.search_tests(pat))
+        for s in query.tests_to_stages(sorted(collected)):
+            print(s)
+    else:
+        for t in query.stages_to_tests(args.stages):
+            print(t)
+
+
+if __name__ == '__main__':
+    main()
diff --git a/tests/unittest/tools/test_test_to_stage_mapping.py b/tests/unittest/tools/test_test_to_stage_mapping.py