Generate *_wgsl.h embedded shaders from *.wgsl (#19981)

JulianCloudNTH · facebook-github-bot · commit fc0ba688c62e · 2026-06-04T14:40:03.000-07:00
Summary:

Adds `backends/webgpu/scripts/gen_wgsl_headers.py` to generate each `runtime/ops/<op>/<shader>_wgsl.h` from its `<shader>.wgsl`, so each WGSL shader has a single canonical source instead of a hand-maintained embedded copy that can silently drift. Each header embeds the shader verbatim (`inline constexpr const char* k<Op>WGSL = R"(...)";` plus `k<Op>WorkgroupSize` parsed from `workgroup_size`) and a `// wgsl-sha256:` of the source; `--check` and the unit test verify each committed header against that embedded sha. Regenerates the two existing committed op headers — `binary_add_wgsl.h` and `rms_norm_wgsl.h` — into this canonical form (embedded shader bodies byte-identical). Adds `test/test_wgsl_codegen.py` (unit + drift test) and a `--check` mode wired into `test_build_webgpu.sh` that fails if any committed header is stale.

This change was authored with assistance from Claude.

Differential Revision: D107403275
diff --git a/backends/webgpu/runtime/ops/add/binary_add_wgsl.h b/backends/webgpu/runtime/ops/add/binary_add_wgsl.h
@@ -8,11 +8,12 @@
 
 #pragma once
 
-namespace executorch {
-namespace backends {
-namespace webgpu {
+#include <cstdint>
 
-// WGSL shader source for element-wise add: output = input1 + alpha * input2
+namespace executorch::backends::webgpu {
+
+// @generated from binary_add.wgsl - DO NOT EDIT.
+// wgsl-sha256: c1ceec80c8d4d3d56986ad91ce0d7f9a57cd8467b8c3aa07a28da70e51d141d9
 inline constexpr const char* kBinaryAddWGSL = R"(
 @group(0) @binding(0) var<storage, read> input1: array<f32>;
 @group(0) @binding(1) var<storage, read> input2: array<f32>;
@@ -38,6 +39,4 @@ fn main(@builtin(global_invocation_id) gid: vec3<u32>) {
 
 inline constexpr uint32_t kBinaryAddWorkgroupSize = 256;
 
-} // namespace webgpu
-} // namespace backends
-} // namespace executorch
+} // namespace executorch::backends::webgpu
diff --git a/backends/webgpu/runtime/ops/rms_norm/rms_norm_wgsl.h b/backends/webgpu/runtime/ops/rms_norm/rms_norm_wgsl.h
@@ -12,13 +12,12 @@
 
 namespace executorch::backends::webgpu {
 
-// WGSL shader source for rms_norm: y = x * w * rsqrt(mean(x^2) + eps)
-//
-// NOTE: This inline string is the runtime source of truth — it is what gets
-// passed to wgpuDeviceCreateShaderModule. The sibling `rms_norm.wgsl` file
-// exists only for editor/tooling support and must be kept identical to this
-// string by hand; there is no build-time sync.
+// @generated from rms_norm.wgsl - DO NOT EDIT.
+// wgsl-sha256: 41ea66b52f9d205e84daf7f67e489197c4242d8b78435b2248d97d547449b95f
 inline constexpr const char* kRmsNormWGSL = R"(
+// NOTE: This file is for editor/tooling support only. The runtime consumes the
+// inline copy of this shader in `rms_norm_wgsl.h` (kRmsNormWGSL). Keep the two
+// in sync by hand — any edit here must be mirrored there.
 @group(0) @binding(0) var<storage, read_write> t_out: array<f32>;
 @group(0) @binding(1) var<storage, read> t_in: array<f32>;
 @group(0) @binding(2) var<storage, read> t_weight: array<f32>;
diff --git a/backends/webgpu/scripts/gen_wgsl_headers.py b/backends/webgpu/scripts/gen_wgsl_headers.py
@@ -0,0 +1,203 @@
+#!/usr/bin/env python3
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+
+"""Generate runtime/ops/<op>/<stem>_wgsl.h from each <stem>.wgsl.
+
+Each header embeds the shader verbatim as `inline constexpr const char*
+k<Pascal>WGSL` plus `k<Pascal>WorkgroupSize` (parsed from @workgroup_size),
+and records the SHA-256 of the shader source on a `// wgsl-sha256:` line.
+
+Usage:
+  gen_wgsl_headers.py            # (re)write all <stem>_wgsl.h
+  gen_wgsl_headers.py --check    # exit 1 if any committed header is stale
+
+Stdlib only (the devserver has no third-party pip).
+"""
+
+import argparse
+import hashlib
+import re
+import sys
+from pathlib import Path
+
+# Root of the WebGPU backend: the parent of the directory holding this script.
+BACKEND_ROOT = Path(__file__).resolve().parents[1]
+
+# The `// wgsl-sha256: <hex>` line that render_header() writes into a header.
+_SHA_RE = re.compile(r"// wgsl-sha256: ([0-9a-f]{64})")
+
+_BSD_HEADER = """\
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
+ * All rights reserved.
+ *
+ * This source code is licensed under the BSD-style license found in the
+ * LICENSE file in the root directory of this source tree.
+ */"""
+
+
+def symbol_base(stem: str) -> str:
+    """snake_case shader stem -> PascalCase symbol base (binary_add -> BinaryAdd)."""
+    return "".join(part.capitalize() for part in stem.split("_"))
+
+
+# A decimal integer literal with an optional integer type suffix.
+_INT_LITERAL_RE = re.compile(r"^(\d+)[uUiI]?$")
+
+# First (x) argument of `@workgroup_size(...)`; blanks may precede the paren.
+_WORKGROUP_SIZE_RE = re.compile(r"@workgroup_size\s*\(\s*([A-Za-z0-9_]+)")
+
+
+def parse_workgroup_size(src: str) -> int:
+    """Resolve the x dim of @workgroup_size: a literal, or an override/const ident.
+
+    Accepts WGSL suffix-typed integer literals (e.g. `64u`, `64i`) both inside
+    `@workgroup_size(...)` and on the right-hand side of an `override`/`const`.
+    The `u32`/`i32` type annotation on `override`/`const` is optional.
+
+    Only a plain decimal literal initializer is resolved. Anything else (a hex
+    literal, an expression such as `64 * 2`) raises instead of silently
+    yielding the leading digits.
+
+    Raises:
+        ValueError: if there is no `@workgroup_size`, or its identifier
+            argument cannot be resolved to a decimal literal.
+    """
+    m = _WORKGROUP_SIZE_RE.search(src)
+    if not m:
+        raise ValueError("no @workgroup_size found")
+    tok = m.group(1)
+    lit = _INT_LITERAL_RE.match(tok)
+    if lit:
+        return int(lit.group(1))
+    # The trailing `;` anchors the literal so a partial match of a longer
+    # initializer is rejected rather than truncated.
+    decl = re.search(
+        r"\b(?:override|const)\s+"
+        + re.escape(tok)
+        + r"\s*(?::\s*[iu]32\s*)?=\s*(\d+)[uUiI]?\s*;",
+        src,
+    )
+    if not decl:
+        raise ValueError(f"cannot resolve @workgroup_size identifier '{tok}'")
+    return int(decl.group(1))
+
+
+def wgsl_sha256(wgsl_text: str) -> str:
+    """Return the hex SHA-256 of the shader text, hashed as UTF-8 bytes."""
+    return hashlib.sha256(wgsl_text.encode("utf-8")).hexdigest()
+
+
+def embedded_sha256(header_text: str) -> str:
+    """Return the sha on the header's `// wgsl-sha256:` line, or "" if absent."""
+    m = _SHA_RE.search(header_text)
+    return m.group(1) if m else ""
+
+
+def render_header(wgsl_path, wgsl_text: str) -> str:
+    """Render the full <stem>_wgsl.h text for a shader (shader embedded verbatim).
+
+    Raises:
+        ValueError: if the shader contains `)"` or has no resolvable
+            @workgroup_size.
+    """
+    if ')"' in wgsl_text:
+        raise ValueError('shader contains )" which would close the R"( literal')
+    stem = Path(wgsl_path).stem
+    base = symbol_base(stem)
+    n = parse_workgroup_size(wgsl_text)
+
+    head = [
+        _BSD_HEADER,
+        "",
+        "#pragma once",
+        "",
+        "#include <cstdint>",
+        "",
+        "namespace executorch::backends::webgpu {",
+        "",
+        f"// @generated from {stem}.wgsl - DO NOT EDIT.",
+        f"// wgsl-sha256: {wgsl_sha256(wgsl_text)}",
+        f'inline constexpr const char* k{base}WGSL = R"(',
+    ]
+    return (
+        "\n".join(head)
+        + "\n"
+        + wgsl_text
+        + ')";'
+        + "\n\n"
+        + f"inline constexpr uint32_t k{base}WorkgroupSize = {n};\n\n"
+        + "} // namespace executorch::backends::webgpu\n"
+    )
+
+
+def discover():
+    """All shader sources under runtime/ops, sorted."""
+    return sorted((BACKEND_ROOT / "runtime/ops").glob("**/*.wgsl"))
+
+
+def main(argv=None) -> int:
+    """Regenerate (default) or verify (`--check`) every embedded WGSL header.
+
+    A header is up to date only when its whole text equals the freshly
+    rendered one, so an edit to the embedded shader that leaves the
+    `// wgsl-sha256:` line alone is still reported / regenerated.
+
+    Returns:
+        0 on success; 1 if a shader is malformed or, with `--check`, any
+        header is missing or stale.
+    """
+    parser = argparse.ArgumentParser(description=__doc__)
+    parser.add_argument(
+        "--check",
+        action="store_true",
+        help="verify committed headers match (exit 1 on drift)",
+    )
+    args = parser.parse_args(argv)
+
+    stale = []
+    missing = []
+    errors = []
+    for wgsl in discover():
+        try:
+            # Decode as UTF-8 explicitly: wgsl_sha256() hashes UTF-8 bytes, so a
+            # locale-dependent decode would make the sha differ across hosts.
+            # UnicodeDecodeError is a ValueError and is reported like the rest.
+            wgsl_text = wgsl.read_text(encoding="utf-8")
+            want = render_header(wgsl, wgsl_text)
+        except ValueError as e:
+            errors.append(f"{wgsl.relative_to(BACKEND_ROOT)}: {e}")
+            continue
+        header = wgsl.with_name(wgsl.stem + "_wgsl.h")
+        have = None
+        if header.exists():
+            # Undecodable bytes just make the comparison fail (header is stale).
+            have = header.read_text(encoding="utf-8", errors="replace")
+        if have == want:
+            continue
+        if args.check:
+            (missing if have is None else stale).append(header)
+        else:
+            header.write_text(want, encoding="utf-8")
+
+    if errors:
+        print("Cannot generate header (malformed shader):")
+        for e in errors:
+            print(f"  {e}")
+    if args.check and missing:
+        print("Missing embedded WGSL headers (run scripts/gen_wgsl_headers.py):")
+        for h in missing:
+            print(f"  {h.relative_to(BACKEND_ROOT)}")
+    if args.check and stale:
+        print("Stale embedded WGSL headers (run scripts/gen_wgsl_headers.py):")
+        for h in stale:
+            print(f"  {h.relative_to(BACKEND_ROOT)}")
+    return 1 if errors or stale or missing else 0
+
+
+if __name__ == "__main__":
+    sys.exit(main())
diff --git a/backends/webgpu/test/test_build_webgpu.sh b/backends/webgpu/test/test_build_webgpu.sh
@@ -15,6 +15,10 @@ EXECUTORCH_ROOT="$(cd "${SCRIPT_DIR}/../../.." && pwd)"
 PYTHON_EXECUTABLE="${PYTHON_EXECUTABLE:-python3}"
 NPROC=$(nproc 2>/dev/null || sysctl -n hw.ncpu)
 
+echo "=== Check embedded WGSL headers are up to date ==="
+"${PYTHON_EXECUTABLE}" "${SCRIPT_DIR}/../scripts/gen_wgsl_headers.py" --check \
+  || { echo "ERROR: *_wgsl.h out of sync with .wgsl; run scripts/gen_wgsl_headers.py"; exit 1; }
+
 # ── Step 1: Python export tests ──────────────────────────────────────────────
 
 echo "=== Step 1: Run Python export tests ==="
diff --git a/backends/webgpu/test/test_wgsl_codegen.py b/backends/webgpu/test/test_wgsl_codegen.py
@@ -0,0 +1,122 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+
+"""Unit + drift tests for the embedded-WGSL-header generator.
+
+Loads the generator by file path (no package/namespace dependency).
+"""
+
+import hashlib
+import importlib.util
+import unittest
+from pathlib import Path
+
+_GEN = Path(__file__).resolve().parents[1] / "scripts" / "gen_wgsl_headers.py"
+_spec = importlib.util.spec_from_file_location("gen_wgsl_headers", _GEN)
+g = importlib.util.module_from_spec(_spec)
+_spec.loader.exec_module(g)
+
+
+class WgslCodegenTest(unittest.TestCase):
+    """Checks the generator's helpers and that committed headers are current."""
+
+    def test_symbol_base(self) -> None:
+        self.assertEqual(g.symbol_base("binary_add"), "BinaryAdd")
+        self.assertEqual(
+            g.symbol_base("sdpa_compute_attn_weights"), "SdpaComputeAttnWeights"
+        )
+        self.assertEqual(g.symbol_base("update_cache"), "UpdateCache")
+        self.assertEqual(g.symbol_base("rms_norm"), "RmsNorm")
+
+    def test_parse_workgroup_literal(self) -> None:
+        self.assertEqual(
+            g.parse_workgroup_size("@compute @workgroup_size(64, 1, 1)\nfn main(){}"),
+            64,
+        )
+
+    def test_parse_workgroup_override_indirection(self) -> None:
+        src = "override wg_size: u32 = 256;\n@compute @workgroup_size(wg_size)\nfn main(){}"
+        self.assertEqual(g.parse_workgroup_size(src), 256)
+
+    def test_parse_workgroup_suffix_typed_literal(self) -> None:
+        self.assertEqual(
+            g.parse_workgroup_size("@compute @workgroup_size(64u, 1, 1)\nfn main(){}"),
+            64,
+        )
+
+    def test_parse_workgroup_const_without_type_annotation(self) -> None:
+        src = "const WG = 128u;\n@compute @workgroup_size(WG)\nfn main(){}"
+        self.assertEqual(g.parse_workgroup_size(src), 128)
+
+    def test_parse_workgroup_not_fooled_by_const(self) -> None:
+        # rms_norm/softmax shape: a sibling `const WG_SIZE` beside a LITERAL size.
+        src = (
+            "const WG_SIZE: u32 = 64u;\n@compute @workgroup_size(64, 1, 1)\nfn main(){}"
+        )
+        self.assertEqual(g.parse_workgroup_size(src), 64)
+
+    def test_parse_workgroup_missing_raises(self) -> None:
+        with self.assertRaises(ValueError):
+            g.parse_workgroup_size("fn main(){}\n")
+
+    def test_parse_workgroup_unresolved_identifier_raises(self) -> None:
+        with self.assertRaises(ValueError):
+            g.parse_workgroup_size("@compute @workgroup_size(WG)\nfn main(){}")
+
+    def test_render_header_shape(self) -> None:
+        wgsl = "@compute @workgroup_size(64, 1, 1)\nfn main(){}\n"
+        h = g.render_header(Path("runtime/ops/update_cache/update_cache.wgsl"), wgsl)
+        self.assertIn("#pragma once", h)
+        self.assertIn("#include <cstdint>", h)
+        self.assertIn("namespace executorch::backends::webgpu {", h)
+        self.assertIn("// @generated from update_cache.wgsl - DO NOT EDIT.", h)
+        self.assertIn('inline constexpr const char* kUpdateCacheWGSL = R"(', h)
+        self.assertIn("inline constexpr uint32_t kUpdateCacheWorkgroupSize = 64;", h)
+        self.assertNotIn("Confidential", h)
+        # the shader is embedded verbatim:
+        body = h.split('R"(', 1)[1].split(')";', 1)[0]
+        self.assertEqual(body, "\n" + wgsl)
+        self.assertTrue(h.endswith("\n"))
+
+    def test_render_header_rejects_raw_string_terminator(self) -> None:
+        # `)"` inside the shader would end the C++ R"( ... )" literal early.
+        wgsl = '@compute @workgroup_size(64)\nfn main(){} // )"\n'
+        with self.assertRaises(ValueError):
+            g.render_header(Path("runtime/ops/x/x.wgsl"), wgsl)
+
+    def test_render_header_embeds_sha256(self) -> None:
+        wgsl = "@compute @workgroup_size(64, 1, 1)\nfn main(){}\n"
+        h = g.render_header(Path("runtime/ops/update_cache/update_cache.wgsl"), wgsl)
+        want = hashlib.sha256(wgsl.encode("utf-8")).hexdigest()
+        self.assertIn(f"// wgsl-sha256: {want}", h)
+        self.assertEqual(g.embedded_sha256(h), want)
+        self.assertEqual(g.wgsl_sha256(wgsl), want)
+
+    def test_embedded_sha256_missing_returns_empty(self) -> None:
+        self.assertEqual(g.embedded_sha256("no sha line here\n"), "")
+
+    def test_sha256_changes_with_shader(self) -> None:
+        a = g.wgsl_sha256("@compute @workgroup_size(64, 1, 1)\nfn main(){}\n")
+        b = g.wgsl_sha256("@compute @workgroup_size(256)\nfn main(){}\n")
+        self.assertNotEqual(a, b)
+
+    def test_committed_headers_match_generator(self) -> None:
+        wgsls = g.discover()
+        self.assertGreater(len(wgsls), 0, "no .wgsl shaders discovered")
+        for wgsl in wgsls:
+            header = wgsl.with_name(wgsl.stem + "_wgsl.h")
+            # subTest: report every missing/stale header, not only the first.
+            with self.subTest(shader=wgsl.name):
+                self.assertTrue(
+                    header.exists(),
+                    f"{header.name} missing; run scripts/gen_wgsl_headers.py",
+                )
+                want = g.render_header(wgsl, wgsl.read_text(encoding="utf-8"))
+                self.assertEqual(
+                    header.read_text(encoding="utf-8"),
+                    want,
+                    f"{header.name} stale; run scripts/gen_wgsl_headers.py",
+                )