add workflow to dispatch

yangw-dev · yangw-dev · commit 7efe32703fe1 · 2025-08-27T19:23:17.000-07:00
ghstack-source-id: 633724d Pull-Request: #161585
diff --git a/.ci/lumen_cli/cli/lib/common/gh_summary.py b/.ci/lumen_cli/cli/lib/common/gh_summary.py
@@ -1,11 +1,12 @@
 from __future__ import annotations
 
 import logging
-import os
 import textwrap
+import xml.etree.ElementTree as ET
 from pathlib import Path
 from typing import TYPE_CHECKING
 
+from cli.lib.common.envs_helper import get_env
 from cli.lib.common.utils import get_wheels
 from jinja2 import Template
 
@@ -16,6 +17,23 @@
 
 logger = logging.getLogger(__name__)
 
+
+# Markdown template for the per-command failure summary: renders the title,
+# then one "### Test Command" section (one bullet per failure) for each entry
+# of `sections` whose `failures` list is non-empty.
+_TPL_FAIL_BY_CMD = Template(
+    textwrap.dedent("""\
+    ## {{ title }}
+
+    {%- for section in sections if section.failures %}
+    ### Test Command: {{ section.label }}
+
+    {%- for f in section.failures %}
+    - {{ f }}
+    {%- endfor %}
+
+    {%- endfor %}
+""")
+)
+
 _TPL_CONTENT = Template(
     textwrap.dedent("""\
     ## {{ title }}
@@ -53,8 +71,17 @@
 
 
 def gh_summary_path() -> Path | None:
-    """Return the Path to the GitHub step summary file, or None if not set."""
-    p = os.environ.get("GITHUB_STEP_SUMMARY")
+    """Return the step summary file to write to, or None if unavailable.
+
+    TEMP_GITHUB_STEP_SUMMARY, when set, takes precedence over
+    GITHUB_STEP_SUMMARY. This is meant for jobs that run inside a docker
+    container; the GitHub workflow is then responsible for forwarding the
+    temp file's content to the real step summary afterwards.
+
+    Returns None when neither variable is set or the file does not exist.
+    """
+    p = get_env("TEMP_GITHUB_STEP_SUMMARY") or get_env("GITHUB_STEP_SUMMARY")
+    if not p or not Path(p).exists():
+        return None
-    return Path(p) if p else None
+    # p is known to be non-empty here, so no further None check is needed.
+    return Path(p)
 
 
@@ -141,3 +168,62 @@ def render_content(
     tpl = _TPL_CONTENT
     md = tpl.render(title=title, content=content, lang=lang)
     return md
+
+
+def summarize_failures_by_test_command(
+    xml_and_labels: Iterable[tuple[str | Path, str]],
+    *,
+    title: str = "Pytest Failures by Test Command",
+    dedupe_within_command: bool = True,
+) -> bool:
+    """
+    Write one Markdown block listing failed tests, grouped by test command.
+
+    Args:
+        xml_and_labels: pairs of (junit XML path, label shown for that command).
+            Paths that do not exist are logged and skipped.
+        title: heading of the rendered block.
+        dedupe_within_command: if True, failures of each command are
+            de-duplicated and sorted.
+
+    Returns:
+        False when there is no failure to report; otherwise the result of
+        write_gh_step_summary for the rendered Markdown.
+    """
+    sections: list[dict] = []
+
+    for xml_path, label in xml_and_labels:
+        report = Path(xml_path)
+        if report.exists():
+            names = _parse_failed(report)
+            if dedupe_within_command:
+                names = sorted(set(names))
+            # keep empty sections too; the template filters them out
+            sections.append({"label": label, "failures": names})
+        else:
+            logger.warning("XML %s not found, skipping", report)
+
+    # Nothing collected, or no section has a failure: do not write anything.
+    if not any(section["failures"] for section in sections):
+        return False
+
+    rendered = _TPL_FAIL_BY_CMD.render(title=title, sections=sections)
+    return write_gh_step_summary(rendered.rstrip() + "\n")
+
+
+def _to_name_from_testcase(tc: ET.Element) -> str:
+    """
+    Build a "<file>:<test name>" display string for a junit <testcase>.
+
+    The "file" attribute is used when present. Otherwise the path is derived
+    from the dotted "classname": the last component is dropped when there are
+    at least two, the rest is joined with "/" and suffixed with ".py".
+    Without either attribute the result starts with "unknown.py".
+    """
+    attrs = tc.attrib
+    name = attrs.get("name", "")
+
+    file_attr = attrs.get("file")
+    if file_attr:
+        return f"{file_attr}:{name}"
+
+    classname = attrs.get("classname", "")
+    if not classname:
+        return f"unknown.py:{name or 'unknown_test'}"
+
+    parts = classname.split(".")
+    mod_parts = parts[:-1] if len(parts) >= 2 else parts
+    mod_path = "/".join(mod_parts) + ".py"
+    return f"{mod_path}:{name}"
+
+
+def _parse_failed(xml_path: Path) -> list[str]:
+    """
+    Return display names of the failed testcases in a junit XML report.
+
+    A testcase counts as failed when it has a direct <failure> or <error>
+    child. A missing or unparsable report (for example one truncated because
+    the test process was killed) yields an empty list instead of raising, so
+    that building the summary does not fail on a broken report.
+    """
+    if not xml_path.exists():
+        return []
+    try:
+        root = ET.parse(xml_path).getroot()
+    except ET.ParseError as e:
+        logger.warning("Malformed junit XML %s, skipping: %s", xml_path, e)
+        return []
+    return [
+        _to_name_from_testcase(tc)
+        for tc in root.iter("testcase")
+        if any(child.tag in {"failure", "error"} for child in tc)
+    ]
diff --git a/.ci/lumen_cli/cli/lib/common/path_helper.py b/.ci/lumen_cli/cli/lib/common/path_helper.py
@@ -17,11 +17,17 @@ def get_path(path: Union[str, Path], resolve: bool = False) -> Path:
     return result.resolve() if resolve else result
 
 
-def ensure_dir_exists(path: Union[str, Path]) -> Path:
-    """Create directory if it doesn't exist."""
-    path_obj = get_path(path)
-    path_obj.mkdir(parents=True, exist_ok=True)
-    return path_obj
+def ensure_path(path: Union[str, Path], is_file: bool = False) -> Path:
+    """Make sure `path` exists and return it as a Path.
+
+    With is_file=False (default) `path` is created as a directory, including
+    parents. With is_file=True the parent directories are created and the
+    file itself is touched.
+    """
+    target = Path(path)
+    # For a file, the directory to create is its parent.
+    directory = target.parent if is_file else target
+    directory.mkdir(parents=True, exist_ok=True)
+    if is_file:
+        target.touch(exist_ok=True)
+    return target
 
 
 def remove_dir(path: Union[str, Path, None]) -> None:
@@ -36,7 +42,7 @@ def remove_dir(path: Union[str, Path, None]) -> None:
 def force_create_dir(path: Union[str, Path]) -> Path:
     """Remove directory if exists, then create fresh empty directory."""
     remove_dir(path)
-    return ensure_dir_exists(path)
+    # is_file defaults to False, so `path` is recreated as a directory
+    return ensure_path(path)
 
 
 def copy(src: Union[str, Path], dst: Union[str, Path]) -> None:
diff --git a/.ci/lumen_cli/cli/lib/common/utils.py b/.ci/lumen_cli/cli/lib/common/utils.py
@@ -4,13 +4,16 @@
 
 import logging
 import os
+import secrets
 import shlex
 import subprocess
 import sys
 from contextlib import contextmanager
 from pathlib import Path
 from typing import Optional
 
+from cli.lib.common.path_helper import ensure_path
+
 
 logger = logging.getLogger(__name__)
 
@@ -137,3 +140,42 @@ def get_wheels(
                 relpath = str((Path(dirpath) / fname).relative_to(root))
                 items.append({"pkg": pkg, "relpath": relpath})
     return items
+
+
+def attach_junitxml_if_pytest(
+    cmd: str,
+    dir: Optional[Path],
+    prefix: str,
+    *,
+    ensure_unique: bool = False,
+    resolve_xml: bool = False,
+) -> tuple[str, Optional[Path]]:
+    """
+    Append --junitxml=<path> to a pytest command string.
+
+    The report file is <dir>/<prefix>[_<random-hex>]_junit_pytest.xml.
+
+    - cmd: command string; returned unchanged unless it contains "pytest"
+    - dir: target folder (will be created), if None, skip the junitxml attachment
+    - prefix: leading part of the report filename
+    - ensure_unique: if True, append "_<8 random hex characters>" to the prefix
+    - resolve_xml: if True, call Path.resolve() on the report path before
+      embedding it in the command
+
+    Returns: (amended_cmd, xml_path), or (cmd, None) when nothing was attached
+    """
+    if "pytest" not in cmd:
+        return cmd, None
+    if dir is None:
+        return cmd, None
+    ensure_path(dir)
+
+    file_name_prefix = f"{prefix}"
+    if ensure_unique:
+        file_name_prefix += f"_{unique_hex(8)}"
+    xml_path = dir / f"{file_name_prefix}_junit_pytest.xml"
+    if resolve_xml:
+        xml_path = xml_path.resolve()
+
+    return f"{cmd} --junitxml={xml_path.as_posix()}", xml_path
+
+
+def unique_hex(length: int = 8) -> str:
+    """Return a random hex string of `length` characters."""
+    # token_hex(n) yields 2*n hex digits: round up, then trim to `length`.
+    n_bytes = (length + 1) // 2
+    digits = secrets.token_hex(n_bytes)
+    return digits[:length]
diff --git a/.ci/lumen_cli/cli/lib/core/vllm/lib.py b/.ci/lumen_cli/cli/lib/core/vllm/lib.py
@@ -1,12 +1,18 @@
 import logging
 import os
 import textwrap
-from typing import Any
+from pathlib import Path
+from typing import Any, Optional
 
 from cli.lib.common.gh_summary import write_gh_step_summary
 from cli.lib.common.git_helper import clone_external_repo
 from cli.lib.common.pip_helper import pip_install_packages
-from cli.lib.common.utils import run_command, temp_environ, working_directory
+from cli.lib.common.utils import (
+    attach_junitxml_if_pytest,
+    run_command,
+    temp_environ,
+    working_directory,
+)
 from jinja2 import Template
 
 
@@ -186,6 +192,9 @@ def run_test_plan(
     tests_map: dict[str, Any],
     shard_id: int = 0,
     num_shards: int = 0,
+    *,
+    test_summary_path: Optional[Path] = None,
+    test_summary_result: Optional[list[tuple[str, str]]] = None,
 ):
     """
     a method to run list of tests based on the test plan.
@@ -198,7 +207,6 @@ def run_test_plan(
     tests = tests_map[test_plan]
     pkgs = tests.get("package_install", [])
     title = tests.get("title", "unknown test")
-
     is_parallel = check_parallelism(tests, title, shard_id, num_shards)
     if is_parallel:
         title = title.replace("%N", f"{shard_id}/{num_shards}")
@@ -212,7 +220,15 @@ def run_test_plan(
         temp_environ(tests.get("env_vars", {})),
     ):
         failures = []
-        for step in tests["steps"]:
+        for idx, step in enumerate(tests["steps"]):
+            # generate xml report for each test for test summary if needed
+            step, xml_file_path = attach_junitxml_if_pytest(
+                cmd=step, dir=test_summary_path, prefix=f"{test_plan}_{idx}"
+            )
+            # The report file does not exist yet (the step has not run), and
+            # the caller may pass an empty list to collect into, so only
+            # compare against None here.
+            if xml_file_path is not None and test_summary_result is not None:
+                # (xml_path, label) is the order that
+                # summarize_failures_by_test_command unpacks.
+                test_summary_result.append((str(xml_file_path), title))
+            else:
+                logger.info("No test report will be generate for %s", step)
             logger.info("Running step: %s", step)
             if is_parallel:
                 step = replace_buildkite_placeholders(step, shard_id, num_shards)
diff --git a/.ci/lumen_cli/cli/lib/core/vllm/vllm_build.py b/.ci/lumen_cli/cli/lib/core/vllm/vllm_build.py
@@ -20,7 +20,7 @@
 )
 from cli.lib.common.path_helper import (
     copy,
-    ensure_dir_exists,
+    ensure_path,
     force_create_dir,
     get_path,
     is_path_exist,
@@ -165,7 +165,7 @@ def run(self):
         self.cp_torch_whls_if_exist(inputs)
 
         # make sure the output dir to store the build artifacts exist
-        ensure_dir_exists(Path(inputs.output_dir))
+        ensure_path(Path(inputs.output_dir))
 
         cmd = self._generate_docker_build_cmd(inputs)
         logger.info("Running docker build: \n %s", cmd)
diff --git a/.ci/lumen_cli/cli/lib/core/vllm/vllm_test.py b/.ci/lumen_cli/cli/lib/core/vllm/vllm_test.py
@@ -11,15 +11,24 @@
 
 from cli.lib.common.cli_helper import BaseRunner
 from cli.lib.common.envs_helper import env_path_field, env_str_field, get_env
+from cli.lib.common.gh_summary import (
+    gh_summary_path,
+    summarize_failures_by_test_command,
+)
 from cli.lib.common.path_helper import copy, remove_dir
 from cli.lib.common.pip_helper import (
     pip_install_first_match,
     pip_install_packages,
     pkg_exists,
     run_python,
 )
-from cli.lib.common.utils import run_command, working_directory
-from cli.lib.core.vllm.lib import clone_vllm, run_test_plan, sample_vllm_test_library
+from cli.lib.common.utils import ensure_path, run_command, working_directory
+from cli.lib.core.vllm.lib import (
+    clone_vllm,
+    run_test_plan,
+    sample_vllm_test_library,
+    summarize_build_info,
+)
 
 
 logger = logging.getLogger(__name__)
@@ -41,13 +50,20 @@ class VllmTestParameters:
         "VLLM_WHEELS_PATH", "./dist/external/vllm/wheels"
     )
 
+    # generate a file to store test summary
+    test_summary_file: Path = env_path_field(
+        "TEMP_GITHUB_STEP_SUMMARY", "./generated_step_summary.md"
+    )
+
     torch_cuda_arch_list: str = env_str_field("TORCH_CUDA_ARCH_LIST", "8.9")
 
     def __post_init__(self):
         if not self.torch_whls_path.exists():
             raise ValueError("missing torch_whls_path")
         if not self.vllm_whls_path.exists():
             raise ValueError("missing vllm_whls_path")
+        # Pre-create the summary file (and its parent directories) so that it
+        # already exists when a summary is written later.
+        if self.test_summary_file:
+            ensure_path(self.test_summary_file, is_file=True)
 
 
 class TestInpuType(Enum):
@@ -91,33 +107,54 @@ def prepare(self):
         logger.info("Display VllmTestParameters %s", params)
         self._set_envs(params)
 
-        clone_vllm(dst=self.work_directory)
+        vllm_commit = clone_vllm(dst=self.work_directory)
         with working_directory(self.work_directory):
             remove_dir(Path("vllm"))
             self._install_wheels(params)
             self._install_dependencies()
         # verify the torches are not overridden by test dependencies
         check_versions()
+        return vllm_commit
 
     def run(self):
         """
         main function to run vllm test
         """
-        self.prepare()
-        with working_directory(self.work_directory):
-            if self.test_type == TestInpuType.TEST_PLAN:
-                if self.num_shards > 1:
+        vllm_commit = self.prepare()
+
+        # prepare test summary: junit reports are written under this folder,
+        # and run_test_plan records the generated reports in the list
+        test_summary_path = Path("tmp_pytest_report").resolve()
+        ensure_path(test_summary_path)
+        test_summary_result = []
+
+        try:
+            with working_directory(self.work_directory):
+                if self.test_type == TestInpuType.TEST_PLAN:
                     run_test_plan(
                         self.test_plan,
                         "vllm",
                         sample_vllm_test_library(),
                         self.shard_id,
                         self.num_shards,
+                        test_summary_path=test_summary_path,
+                        test_summary_result=test_summary_result,
                     )
                 else:
-                    run_test_plan(self.test_plan, "vllm", sample_vllm_test_library())
-            else:
-                raise ValueError(f"Unknown test type {self.test_type}")
+                    raise ValueError(f"Unknown test type {self.test_type}")
+        except Exception as e:
+            logger.error("Failed to run vllm test: %s", e)
+            # bare raise re-raises the active exception with its traceback intact
+            raise
+        finally:
+            # always emit the summary, whether the tests passed or failed
+            self.vllm_test_gh_summary(vllm_commit, test_summary_result)
+
+    def vllm_test_gh_summary(
+        self, vllm_commit: str, test_summary_results: list[tuple[str, str]]
+    ):
+        """
+        Write the build info and the per-command test failures to the GH summary.
+
+        Does nothing (besides logging) when gh_summary_path() reports that no
+        summary file is available.
+        """
+        summary_file = gh_summary_path()
+        if not summary_file:
+            logger.info("Skipping, not detect GH Summary env var....")
+            return
+
+        logger.info("Generate GH Summary ...")
+        summarize_build_info(vllm_commit)
+        summarize_failures_by_test_command(test_summary_results)
 
     def _install_wheels(self, params: VllmTestParameters):
         logger.info("Running vllm test with inputs: %s", params)
diff --git a/.ci/lumen_cli/tests/test_path_helper.py b/.ci/lumen_cli/tests/test_path_helper.py
diff --git a/.ci/lumen_cli/tests/test_vllm.py b/.ci/lumen_cli/tests/test_vllm.py
diff --git a/.github/workflows/_linux-test.yml b/.github/workflows/_linux-test.yml