Add readme test to examples

fynnsu · fynnsu · commit a1b0aea6aeaf · 2025-09-17T13:41:45.000-04:00
Signed-off-by: Fynn Schmitt-Ulms <fschmitt@redhat.com>
diff --git a/tests/examples/test_readmes.py b/tests/examples/test_readmes.py
@@ -0,0 +1,31 @@
+from tests.examples.utils import ReadMe
+
+from pathlib import Path
+
+import pytest
+
+
+@pytest.mark.example
+@pytest.mark.parametrize(
+    "subdir",
+    [
+        "quantization_2of4_sparse_w4a16",
+        "quantization_kv_cache",
+        "quantization_w4a16",
+        "quantization_w8a8_fp8",
+        "quantization_w8a8_int8",
+        "quantizing_moe",
+    ],
+)
+def test_readmes(subdir):
+    path = Path("examples") / subdir / "README.md"
+
+    readme = ReadMe(path)
+
+    cmd = readme.get_code_block_content(position=1, lang="bash").split()
+
+    assert cmd[0] in ["python", "python3"]
+
+    script_path = Path("examples") / subdir / cmd[1]
+
+    assert script_path.is_file(), f"Could not find script at {script_path}"
diff --git a/tests/examples/utils.py b/tests/examples/utils.py
@@ -1,6 +1,10 @@
-from typing import Union
+import re
+from typing import Union, Optional
+from pathlib import Path
 
 import pytest
+from bs4 import BeautifulSoup, ResultSet, Tag
+from cmarkgfm import github_flavored_markdown_to_html as gfm_to_html
 
 
 def requires_gpu_count(num_required_gpus: int) -> pytest.MarkDecorator:
@@ -37,3 +41,50 @@ def requires_gpu_mem(required_amount: Union[int, float]) -> pytest.MarkDecorator
         f"{actual_vram:.1f} GiB GPU memory found"
     )
     return pytest.mark.skipif(required_amount > actual_vram, reason=reason)
+
+
+class ReadMe:
+    """
+    Class representing a README (Markdown) file with methods to expedite common usage.
+    """
+
+    def __init__(self, path: Path) -> None:
+        self.path = path
+        self.content = self.path.expanduser().read_text(encoding="utf-8")
+        self.__normalize_code_fence_lang()
+        self.html = gfm_to_html(self.content)
+        self.soup = BeautifulSoup(self.html, "html.parser")
+
+    def __normalize_code_fence_lang(self):
+        """
+        Perform limited normalization on the code language of code blocks to maintain
+        consistency and simplicity with locating them.
+        """
+        self.content = re.sub(r"```(shell|bash|sh)\b", "```shell", self.content)
+
+    def get_code_blocks(self, *, lang: Optional[str] = None) -> ResultSet[Tag]:
+        """
+        Get all code blocks with language `lang`, or all code blocks if `lang` is None
+        (default).
+        :param lang: language of code block to filter by
+        :return: code block `Tag`s found in README
+        """
+        lang = "shell" if lang == "bash" else lang
+        selector = f'pre[lang="{lang}"] > code' if lang else "pre > code"
+        tags = self.soup.select(selector)
+        return tags
+
+    def get_code_block_content(
+        self, *, position: int, lang: Optional[str] = None
+    ) -> str:
+        """
+        Get contents of code block at specified position (starting with 0). Optionally
+        pass a language specifier, `lang`, to only look at code blocks highlighted for
+        that language (happens prior to indexing).
+        :param position: position of code block to get (starting at 0)
+        :param lang: language of code block to filter by
+        :return: content of the code block
+        """
+        code_blocks = self.get_code_blocks(lang=lang)
+        code = code_blocks[position].text.strip()
+        return code