Initial guest-to-host trampoline generation

2025-12-13 15:16:27 +00:00 · 2025-10-30 02:23:09 -06:00
parent 9367f003c5
commit 55a62a27c9
85 changed files with 1750 additions and 1807 deletions
--- a/tools/gen_trampolines.py
+++ b/tools/gen_trampolines.py
@@ -0,0 +1,248 @@
+#!/usr/bin/env -S uv run --script
+# /// script
+# requires-python = ">=3.10"
+# dependencies = ["clang==17.0.6"]
+# ///
+"""
+Generate Windows ABI trampolines by scanning C++ prototypes using libclang.
+
+This emits x86 trampolines for guest-to-host calls.
+"""
+
+if __name__ == "__main__":
+    import script_venv
+
+    script_venv.bootstrap_venv(__file__)
+
+import argparse
+import os
+import sys
+import tempfile
+
+from clang.cindex import (
+    Config,
+    Cursor,
+    CursorKind,
+    Index,
+    TranslationUnit,
+)
+from dataclasses import dataclass
+from pathlib import Path
+from typing import Iterable, List, Optional
+
+# Allow libclang path to be specified via environment variable
+if "LIBCLANG_PATH" in os.environ:
+    libclang_path = os.environ["LIBCLANG_PATH"]
+    if os.path.isfile(libclang_path):
+        Config.set_library_file(libclang_path)
+    elif os.path.isdir(libclang_path):
+        Config.set_library_path(libclang_path)
+    else:
+        sys.stderr.write(
+            f"Warning: LIBCLANG_PATH={libclang_path} is not a file or directory\n"
+        )
+
+
+@dataclass
+class FuncInfo:
+    qualified_ns: str
+    name: str
+    mangled: str
+    argc: int
+    stdcall: bool
+
+
+def parse_tu(
+    headers: List[str], include_dirs: List[str], target: str
+) -> TranslationUnit:
+    # Construct a tiny TU that includes the requested headers
+    tu_source = "\n".join([f'#include "{h}"' for h in headers]) + "\n"
+    with tempfile.NamedTemporaryFile("w", suffix=".cpp") as tf:
+        tf.write(tu_source)
+        tf.flush()
+        args = [
+            "-x",
+            "c++",
+            "-std=c++17",
+            "-target",
+            target,
+            "-DWIBO_CODEGEN=1",
+        ] + [arg for inc in include_dirs for arg in ("-I", inc)]
+
+        index = Index.create()
+        tu = index.parse(
+            tf.name, args=args, options=TranslationUnit.PARSE_SKIP_FUNCTION_BODIES
+        )
+        for d in tu.diagnostics:
+            if d.severity >= d.Warning:
+                sys.stderr.write(str(d) + "\n")
+        return tu
+
+
+def _cursor_namespace(cursor: Cursor) -> List[str]:
+    ns: List[str] = []
+    c = cursor
+    while c is not None and c.kind != CursorKind.TRANSLATION_UNIT:
+        if c.kind == CursorKind.NAMESPACE and c.spelling:
+            ns.append(c.spelling)
+        c = c.semantic_parent
+    return list(reversed(ns))
+
+
+def _has_stdcall_annotation(func: Cursor) -> bool:
+    for child in func.get_children():
+        if child.kind == CursorKind.ANNOTATE_ATTR and child.spelling == "CC:stdcall":
+            return True
+    return False
+
+
+def _arg_count(func: Cursor) -> int:
+    return sum(1 for _ in func.type.argument_types())
+
+
+def collect_functions(tu: TranslationUnit, ns_filter: Optional[str]) -> List[FuncInfo]:
+    want_ns = ns_filter.split("::") if ns_filter else None
+    out: dict[str, FuncInfo] = {}
+
+    def visit(node: Cursor) -> None:
+        if node.kind == CursorKind.FUNCTION_DECL:
+            ns_parts = _cursor_namespace(node)
+            if want_ns is not None and ns_parts != want_ns:
+                return
+            name = node.spelling or ""
+            mangled = getattr(node, "mangled_name", None) or ""
+            if not name or not mangled:
+                return
+            out[name] = FuncInfo(
+                qualified_ns="::".join(ns_parts),
+                name=name,
+                mangled=mangled,
+                argc=_arg_count(node),
+                stdcall=_has_stdcall_annotation(node),
+            )
+        # Recurse into children where it makes sense
+        if node.kind in (CursorKind.TRANSLATION_UNIT, CursorKind.NAMESPACE):
+            for c in node.get_children():
+                visit(c)
+
+    visit(tu.cursor)
+    return sorted(out.values(), key=lambda f: f.name)
+
+
+def emit_x86_asm_trampolines(dll: str, funcs: Iterable[FuncInfo]) -> str:
+    lines: List[str] = []
+    lines.append("#\tAuto-generated trampolines; DO NOT EDIT.")
+    lines.append(".section .note.GNU-stack, \"\", @progbits")
+    lines.append(".text")
+    for f in funcs:
+        name = f.name
+        mangled = f.mangled
+        # Ensure ms_abi is encoded for stdcall function-pointer types to match GCC
+        # mangled = mangled.replace("U7stdcall", "U7stdcallU6ms_abi")
+        tramp = f"thunk_{dll}_{name}"
+        lines.append("")
+        lines.append(f".globl {tramp}")
+        lines.append(f".type {tramp}, @function")
+        lines.append(f"{tramp}:")
+        argc = int(f.argc or 0)
+        # Calculate number of stack args (fastcall uses ECX/EDX for first 2)
+        stack_argc = max(0, argc - 2)
+        stack_bytes = stack_argc * 4
+        # Use frame pointer for clean alignment and argument access
+        lines.append("\tpush %ebp")
+        lines.append("\tmovl %esp, %ebp")
+        # Align stack: we want ESP = 16n before the call,
+        # so that after call pushes return address, callee sees ESP = 16n - 4
+        # After pushing stack_bytes worth of args, we need ESP = 16n + stack_bytes
+        if stack_bytes > 0:
+            lines.append(f"\tleal -{stack_bytes}(%ebp), %esp")
+            lines.append("\tandl $0xFFFFFFF0, %esp")
+            lines.append(f"\taddl ${stack_bytes}, %esp")
+        else:
+            # No stack args, just align to 16n for the call
+            lines.append("\tandl $0xFFFFFFF0, %esp")
+        # Move first two args into ECX/EDX for fastcall
+        if argc >= 1:
+            lines.append("\tmovl 8(%ebp), %ecx")
+        if argc >= 2:
+            lines.append("\tmovl 12(%ebp), %edx")
+        # Push remaining args (from last down to the 3rd) so layout matches fastcall
+        for i in range(argc, 2, -1):
+            off = 4 * (i + 1)  # +1 because EBP offset includes pushed EBP
+            lines.append(f"\tpushl {off}(%ebp)")
+        # Call into fastcall stub
+        lines.append(f"\tcall {mangled}")
+        # Restore stack and frame pointer
+        lines.append("\tleave")
+        # Return to guest
+        argb = argc * 4
+        if f.stdcall and argb:
+            lines.append(f"\tret ${argb}")
+        else:
+            lines.append("\tret")
+        lines.append(f".size {tramp}, . - {tramp}")
+    return "\n".join(lines) + "\n"
+
+
+def emit_header_mapping(dll: str, funcs: Iterable[FuncInfo]) -> str:
+    guard = f"WIBO_GEN_{dll.upper()}_TRAMPOLINES_H"
+    lines: List[str] = []
+    lines.append("/* Auto-generated; DO NOT EDIT. */")
+    lines.append(f"#ifndef {guard}")
+    lines.append(f"#define {guard}")
+    lines.append("#include <stddef.h>")
+    lines.append("#include <string.h>")
+    lines.append('#ifdef __cplusplus\nextern "C" {\n#endif')
+    for f in funcs:
+        tramp = f"thunk_{dll}_{f.name}"
+        lines.append(f"void {tramp}(void);")
+    lines.append("#ifdef __cplusplus\n}\n#endif")
+    lines.append("")
+    # name->address helper for resolveByName
+    lines.append("static inline void *%s_trampoline_by_name(const char *name) {" % dll)
+    for f in funcs:
+        lines.append(
+            f'\tif (strcmp(name, "{f.name}") == 0) return (void*)&thunk_{dll}_{f.name};'
+        )
+    lines.append("\treturn NULL;")
+    lines.append("}")
+    lines.append(f"#endif /* {guard} */\n")
+    return "\n".join(lines)
+
+
+def main() -> int:
+    ap = argparse.ArgumentParser()
+    ap.add_argument("--dll", required=True, help="DLL name, e.g. kernel32")
+    ap.add_argument("--headers", nargs="+", required=True, help="Header files to scan")
+    ap.add_argument(
+        "--namespace", dest="ns", default=None, help="Namespace filter, e.g. kernel32"
+    )
+    ap.add_argument("--arch", choices=["x86"], default="x86")
+    ap.add_argument(
+        "--out-asm", type=Path, required=True, help="Output assembly file (.S)"
+    )
+    ap.add_argument(
+        "--out-hdr", type=Path, required=True, help="Output header file (.h)"
+    )
+    ap.add_argument("-I", dest="incs", action="append", default=[])
+    args = ap.parse_args()
+
+    target = "i686-pc-linux-gnu" if args.arch == "x86" else "x86_64-pc-linux-gnu"
+    tu = parse_tu(args.headers, args.incs, target)
+    funcs = collect_functions(tu, args.ns)
+    if not funcs:
+        sys.stderr.write("No functions found for generation.\n")
+        return 1
+
+    asm = emit_x86_asm_trampolines(args.dll, funcs)
+    hdr = emit_header_mapping(args.dll, funcs)
+
+    args.out_asm.parent.mkdir(parents=True, exist_ok=True)
+    args.out_hdr.parent.mkdir(parents=True, exist_ok=True)
+    args.out_asm.write_text(asm)
+    args.out_hdr.write_text(hdr)
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
--- a/tools/script_venv.py
+++ b/tools/script_venv.py
@@ -0,0 +1,236 @@
+#!/usr/bin/env python3
+"""
+Reusable venv management for PEP 723 inline script dependencies.
+
+This module provides utilities to:
+1. Parse PEP 723 inline script metadata blocks
+2. Create and manage virtual environments
+3. Track dependencies and reinstall when they change
+"""
+
+import hashlib
+import json
+import os
+import re
+import subprocess
+import sys
+import venv
+from pathlib import Path
+
+
+SCRIPT_BLOCK_RE = re.compile(r"(?m)^# /// script$\s(?P<content>(^#(| .*)$\s)+)^# ///$")
+
+
+def _load_toml(text: str) -> dict:
+    """Load TOML using stdlib tomllib or third-party tomli as a fallback."""
+    try:
+        import tomllib  # type: ignore[attr-defined]
+    except Exception:
+        try:
+            import tomli as tomllib  # type: ignore[no-redef]
+        except Exception as exc:  # pragma: no cover - import error path
+            raise SystemExit(
+                "Missing TOML parser. Install 'tomli' or use Python >= 3.11."
+            ) from exc
+    return tomllib.loads(text)
+
+
+def read_pep723_metadata(script_path: Path) -> dict:
+    """
+    Parse PEP 723 inline script metadata from a Python file.
+
+    Returns the parsed TOML data as a dict, or empty dict if no block found.
+    """
+    text = script_path.read_text(encoding="utf-8")
+    m = SCRIPT_BLOCK_RE.search(text)
+    if not m:
+        return {}
+    content = m.group("content")
+    toml_lines: list[str] = []
+    for line in content.splitlines():
+        if not line.startswith("#"):
+            continue
+        # Strip the leading comment marker and a single optional space
+        if line.startswith("# "):
+            toml_lines.append(line[2:])
+        else:
+            toml_lines.append(line[1:])
+
+    toml_text = "\n".join(toml_lines)
+    return _load_toml(toml_text)
+
+
+def deps_digest(deps: list[str]) -> str:
+    """Compute a stable hash of the dependency list."""
+    return hashlib.sha256(json.dumps(sorted(deps)).encode()).hexdigest()
+
+
+def in_venv() -> bool:
+    """
+    Check if we're currently running inside a virtual environment.
+    """
+    return sys.prefix != sys.base_prefix
+
+
+def _parse_version_tuple(v: str) -> tuple[int, int, int]:
+    """Parse a version like '3.12.1' into a 3-tuple, ignoring any suffixes."""
+    parts = re.findall(r"\d+", v)
+    nums = [int(p) for p in parts[:3]]
+    while len(nums) < 3:
+        nums.append(0)
+    return tuple(nums)  # type: ignore[return-value]
+
+
+def _satisfies_requires_python(
+    spec: str, current: tuple[int, int, int] | None = None
+) -> bool:
+    """
+    Minimal evaluator for PEP 440-like specifiers in requires-python.
+
+    Supports common operators: >=, >, <=, <, ==, != and wildcard '==3.12.*'.
+    Combines multiple comma-separated specifiers with logical AND.
+    """
+    cur = current or (
+        sys.version_info.major,
+        sys.version_info.minor,
+        sys.version_info.micro,
+    )
+
+    def cmp(a: tuple[int, int, int], b: tuple[int, int, int]) -> int:
+        return (a > b) - (a < b)
+
+    for raw in spec.split(","):
+        s = raw.strip()
+        if not s:
+            continue
+        op = None
+        for candidate in (">=", "<=", "==", "!=", ">", "<"):
+            if s.startswith(candidate):
+                op = candidate
+                ver = s[len(candidate) :].strip()
+                break
+        if op is None:
+            # Treat bare version as ==version (prefix match compatible with '==3.12.*')
+            op, ver = "==", s
+        wildcard = op in {"==", "!="} and ver.endswith(".*")
+        if wildcard:
+            ver = ver[:-2]
+        tgt = _parse_version_tuple(ver)
+        c = cmp(cur, tgt)
+        if op == ">=":
+            if c < 0:
+                return False
+        elif op == ">":
+            if c <= 0:
+                return False
+        elif op == "<=":
+            if c > 0:
+                return False
+        elif op == "<":
+            if c >= 0:
+                return False
+        elif op == "==":
+            if wildcard:
+                # Prefix equality: compare only provided components
+                prefix = _parse_version_tuple(ver)  # already trimmed
+                plen = 2 if ver.count(".") == 1 else 3
+                if tuple(cur[:plen]) != tuple(prefix[:plen]):
+                    return False
+            else:
+                if c != 0:
+                    return False
+        elif op == "!=":
+            if wildcard:
+                prefix = _parse_version_tuple(ver)
+                plen = 2 if ver.count(".") == 1 else 3
+                if tuple(cur[:plen]) == tuple(prefix[:plen]):
+                    return False
+            else:
+                if c == 0:
+                    return False
+        else:
+            return False
+    return True
+
+
+def is_venv_managed(venv_dir: Path) -> bool:
+    """Check if a venv was created by this script manager."""
+    marker = venv_dir / ".script-managed"
+    return marker.exists()
+
+
+def get_venv_digest(venv_dir: Path) -> str | None:
+    """Get the stored dependency digest from a managed venv."""
+    marker = venv_dir / ".script-managed"
+    if not marker.exists():
+        return None
+    return marker.read_text().strip()
+
+
+def set_venv_digest(venv_dir: Path, digest: str) -> None:
+    """Store the dependency digest in a managed venv."""
+    marker = venv_dir / ".script-managed"
+    marker.write_text(digest)
+
+
+def create_venv(venv_dir: Path) -> Path:
+    """Create a new virtual environment and return the path to its Python binary."""
+    python_bin = venv_dir / ("Scripts/python.exe" if os.name == "nt" else "bin/python")
+    if not python_bin.exists():
+        venv.create(venv_dir, with_pip=True)
+    return python_bin
+
+
+def install_deps(python_bin: Path, deps: list[str]) -> None:
+    """Install dependencies into a virtual environment."""
+    if not deps:
+        return
+    subprocess.check_call([str(python_bin), "-m", "pip", "install", *deps])
+
+
+def bootstrap_venv(script_file: str) -> None:
+    """
+    Bootstrap the script with its venv if not already running in one.
+
+    If script_path is None, uses __file__ from the calling context.
+    This function will re-exec the script with the venv's Python if needed.
+    """
+    # Allow users to opt out entirely
+    if os.environ.get("AUTOVENV", "1").lower() in {"0", "false", "no"}:
+        return
+
+    script_path = Path(script_file).resolve()
+
+    # Read PEP 723 metadata
+    meta = read_pep723_metadata(script_path)
+    # Enforce requires-python if declared
+    requires = meta.get("requires-python")
+    if isinstance(requires, str) and not _satisfies_requires_python(requires):
+        msg = (
+            f"Python {sys.version_info.major}.{sys.version_info.minor}.{sys.version_info.micro} "
+            f"does not satisfy requires-python: {requires}"
+        )
+        raise SystemExit(msg)
+    deps = meta.get("dependencies", [])
+    current_digest = deps_digest(deps)
+
+    if in_venv():
+        # Already in a venv, use it
+        venv_dir = Path(sys.prefix)
+        python_bin = Path(sys.executable)
+        managed = is_venv_managed(venv_dir)
+    else:
+        # Create a new managed venv
+        venv_dir = script_path.parent / ".venv"
+        python_bin = create_venv(venv_dir)
+        managed = True
+
+    stored_digest = get_venv_digest(venv_dir)
+    if managed and stored_digest != current_digest:
+        # Managed venv and deps changed, reinstall
+        install_deps(python_bin, deps)
+        set_venv_digest(venv_dir, current_digest)
+
+    if venv_dir != Path(sys.prefix):
+        # Re-exec with venv Python
+        os.execv(str(python_bin), [str(python_bin), str(script_path), *sys.argv[1:]])