mirror of
https://github.com/feder-cr/invisible_playwright.git
synced 2026-06-10 08:45:13 +02:00
windows-latest headless kept flaking on special-scheme pages: data: URLs get re-normalized (re-nav), about:blank + redundant goto destroys the context, and both can carry a CSP that blocks eval(). Serve the test page over a real http://127.0.0.1 instead — none of those quirks, and it adds real-navigation coverage (await a response). Evaluates stay arrow-functions (no eval), listeners are inline-script (no on* attrs), and transient context-destroyed/detached/timeout gets up to 2 retries. A genuinely broken binary fails all 3 attempts.
173 lines
8.2 KiB
Python
173 lines
8.2 KiB
Python
#!/usr/bin/env python3
|
|
"""CI drive gate — the firefox-N catcher.
|
|
|
|
A raw `firefox --screenshot` proves nothing about automation: a juggler-less
|
|
binary renders a screenshot just fine and ships broken (firefox-8 did exactly
|
|
that). This DRIVES the binary the way users will — Playwright launches it over
|
|
the juggler pipe and exercises the input/DOM paths real callers depend on.
|
|
|
|
It deliberately covers the failure modes that HISTORICALLY shipped green:
|
|
- juggler missing entirely → TargetClosedError on launch (firefox-8)
|
|
- mouse/keyboard input broken → click/move/type assertions (firefox-2 #9:
|
|
jugglerSendMouseEvent / synthesizeMouseEvent)
|
|
- canvas non-deterministic → identical draw → identical dataURL (stealth
|
|
seed must be per-session, not per-readback)
|
|
- headless navigator tells → navigator.webdriver falsy, languages
|
|
non-empty, plugins is a real PluginArray
|
|
- real HTTP navigation broken → the page is served over http://127.0.0.1
|
|
and a `response` is awaited (not data:/about:blank)
|
|
|
|
All of this is headless, NO screenshot → GPU-free (can't false-fail on the
|
|
GPU-less hosted runners). The HTTP server is loopback-only → no external network,
|
|
no proxy, no secrets → safe in public CI. WebGL determinism is intentionally NOT
|
|
checked here (needs SWGL, false-fails headless); it lives in the local realness
|
|
gate, along with the faithful cross-origin iframe test (issue #20 — a same-origin
|
|
in-gate iframe is a weak proxy AND races Juggler's frame tracking).
|
|
|
|
Robustness (learned the hard way, across many runner round-trips):
|
|
- The page is served over real `http://127.0.0.1:<port>/`. A `data:` URL gets
|
|
re-normalized (re-navigated) by Firefox, `about:blank` + a redundant goto
|
|
intermittently "destroys the execution context by navigation", and both can
|
|
carry a CSP that blocks `eval()`. A plain loopback HTTP page has none of that.
|
|
- Every `page.evaluate` is an ARROW FUNCTION (Playwright callFunction, never
|
|
eval'd) — immune to a page CSP that blocks eval. Listeners are wired in an
|
|
inline <script> on the served page, not via inline on* attributes.
|
|
- Transient "context destroyed / detached / target closed" gets up to 2 logged
|
|
retries (the windows-latest headless runner is interaction-flaky); a
|
|
genuinely broken binary fails ALL attempts → the gate fails.
|
|
|
|
Usage: python ci_drive_gate.py /path/to/firefox[.exe | .app/Contents/MacOS/firefox]
|
|
Exit 0 + "DRIVE GATE OK ..." on success; non-zero with a reason on failure.
|
|
"""
|
|
from __future__ import annotations
|
|
|
|
import http.server
|
|
import socketserver
|
|
import sys
|
|
import threading
|
|
|
|
# Full page served over loopback http. Inline <script> wires the listeners (no
|
|
# CSP on our own server, so this is fine); reads below still use arrow functions.
|
|
HTML = (
|
|
"<!doctype html><html><head><title>dt</title></head><body>"
|
|
"<h1 id=x>hello-drive</h1>"
|
|
"<button id=b>go</button>"
|
|
"<input id=inp>"
|
|
"<script>"
|
|
"window.__clicked=0;window.__moves=0;"
|
|
"document.getElementById('b').addEventListener('click',function(){window.__clicked=1;});"
|
|
"window.addEventListener('mousemove',function(){window.__moves++;});"
|
|
"</script>"
|
|
"</body></html>"
|
|
).encode()
|
|
|
|
# Identical 2D draw, evaluated twice in one session. The stealth canvas spoof is
|
|
# seeded per-session (see fingerprint-consistency rule), so two identical draws
|
|
# MUST produce byte-identical output. Per-readback noise → instant bot flag.
|
|
CANVAS_DRAW = (
|
|
"() => {const c=document.createElement('canvas');c.width=c.height=16;"
|
|
"const g=c.getContext('2d');g.fillStyle='#08f';g.fillRect(0,0,16,16);"
|
|
"g.fillStyle='#f40';g.fillText('s',2,12);return c.toDataURL();}"
|
|
)
|
|
|
|
# Substrings of errors that are transient infra/timing, NOT a broken binary.
|
|
_TRANSIENT = ("context was destroyed", "frame was detached", "target closed",
|
|
"because of a navigation", "timeout")
|
|
|
|
|
|
class _Handler(http.server.BaseHTTPRequestHandler):
|
|
def do_GET(self): # noqa: N802
|
|
self.send_response(200)
|
|
self.send_header("Content-Type", "text/html; charset=utf-8")
|
|
self.send_header("Content-Length", str(len(HTML)))
|
|
self.end_headers()
|
|
self.wfile.write(HTML)
|
|
|
|
def log_message(self, *a): # silence the per-request stderr noise
|
|
pass
|
|
|
|
|
|
def _start_server():
|
|
srv = socketserver.TCPServer(("127.0.0.1", 0), _Handler)
|
|
threading.Thread(target=srv.serve_forever, daemon=True).start()
|
|
return srv, srv.server_address[1]
|
|
|
|
|
|
def _drive(exe: str, url: str) -> str:
|
|
"""One full drive attempt. Returns the UA on success; raises on failure."""
|
|
from playwright.sync_api import sync_playwright
|
|
|
|
with sync_playwright() as p:
|
|
browser = p.firefox.launch(executable_path=exe, headless=True)
|
|
try:
|
|
page = browser.new_page()
|
|
resp = page.goto(url, wait_until="load")
|
|
assert resp and resp.ok, f"navigation to {url} failed: {resp.status if resp else 'no response'}"
|
|
|
|
ua = page.evaluate("() => navigator.userAgent")
|
|
webdriver = page.evaluate("() => navigator.webdriver")
|
|
text = page.evaluate("() => document.getElementById('x').textContent")
|
|
|
|
# firefox-2 / issue-#9 catcher: real mouse + keyboard over juggler.
|
|
page.wait_for_selector("#b")
|
|
page.mouse.move(20, 20)
|
|
page.mouse.move(120, 90) # exercises synthesizeMouseEvent path
|
|
page.click("#b") # mousedown/up/click → listener fires
|
|
page.click("#inp")
|
|
page.keyboard.type("ok")
|
|
clicked = page.evaluate("() => window.__clicked")
|
|
moves = page.evaluate("() => window.__moves")
|
|
typed = page.evaluate("() => document.getElementById('inp').value")
|
|
|
|
# stealth-determinism catcher: identical draw → identical dataURL.
|
|
canvas_a = page.evaluate(CANVAS_DRAW)
|
|
canvas_b = page.evaluate(CANVAS_DRAW)
|
|
|
|
# BotD navigator-surface tells (proxy-free subset).
|
|
langs = page.evaluate("() => navigator.languages.length")
|
|
plugins = page.evaluate("() => navigator.plugins instanceof PluginArray")
|
|
finally:
|
|
browser.close()
|
|
|
|
assert "Firefox" in ua, f"unexpected UA (binary not driving correctly): {ua!r}"
|
|
assert text == "hello-drive", f"DOM/JS roundtrip failed: {text!r}"
|
|
assert not webdriver, f"navigator.webdriver leaked True (stealth regression): {webdriver!r}"
|
|
assert clicked == 1, "page.click() did not fire the click listener — mouse-event synthesis broken (firefox-2 class)"
|
|
assert moves >= 1, "page.mouse.move() produced no mousemove — jugglerSendMouseEvent regression"
|
|
assert typed == "ok", f"page.keyboard.type() failed: {typed!r}"
|
|
assert canvas_a == canvas_b, "canvas non-deterministic across identical draws (stealth seed broken → bot tell)"
|
|
assert langs and langs > 0, "navigator.languages empty (headless tell)"
|
|
assert plugins, "navigator.plugins is not a PluginArray (headless tell)"
|
|
return ua
|
|
|
|
|
|
def main(exe: str) -> int:
|
|
srv, port = _start_server()
|
|
url = f"http://127.0.0.1:{port}/"
|
|
last = None
|
|
try:
|
|
for attempt in (1, 2, 3):
|
|
try:
|
|
ua = _drive(exe, url)
|
|
if attempt > 1:
|
|
print(f"(note: drive succeeded on attempt {attempt} after a transient error)")
|
|
print(f"DRIVE GATE OK | UA={ua} | http+click+mousemove+keyboard+canvas-determinism+navsurface=ok")
|
|
return 0
|
|
except Exception as e: # noqa: BLE001 — gate: any failure must surface
|
|
last = e
|
|
msg = str(e).lower()
|
|
if attempt < 3 and any(t in msg for t in _TRANSIENT):
|
|
print(f"(transient error on attempt {attempt}, retrying): {e}", file=sys.stderr)
|
|
continue
|
|
break
|
|
finally:
|
|
srv.shutdown()
|
|
print(f"DRIVE GATE FAILED: {last}", file=sys.stderr)
|
|
return 1
|
|
|
|
|
|
if __name__ == "__main__":
|
|
if len(sys.argv) != 2:
|
|
print("usage: ci_drive_gate.py <path-to-firefox-binary>", file=sys.stderr)
|
|
sys.exit(2)
|
|
sys.exit(main(sys.argv[1]))
|