From 3bcb288d13ff8e39a043ce760b44b23e762f0623 Mon Sep 17 00:00:00 2001
From: Valerio <88933932+0xMassi@users.noreply.github.com>
Date: Tue, 12 May 2026 11:46:33 +0200
Subject: [PATCH] fix(fetch): guard challenge detection before utf8 decoding

---
 crates/webclaw-fetch/src/client.rs | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/crates/webclaw-fetch/src/client.rs b/crates/webclaw-fetch/src/client.rs
index 4fff454..810c450 100644
--- a/crates/webclaw-fetch/src/client.rs
+++ b/crates/webclaw-fetch/src/client.rs
@@ -783,6 +783,10 @@ fn is_pdf_content_type(headers: &http::HeaderMap) -> bool {
 
 /// Detect if a response looks like a bot protection challenge page.
 fn is_challenge_response(response: &Response) -> bool {
+    let body_len = response.body().len();
+    if body_len > 15_000 || body_len == 0 {
+        return false;
+    }
     is_challenge_html(response.text().as_ref())
 }
 