Initial release: webclaw v0.1.0 — web content extraction for LLMs

CLI + MCP server for extracting clean, structured content from any URL.
6 Rust crates, 10 MCP tools, TLS fingerprinting, 5 output formats.

MIT Licensed | https://webclaw.io
This commit is contained in:
Valerio 2026-03-23 18:31:11 +01:00
commit c99ec684fa
79 changed files with 24074 additions and 0 deletions

View file

@@ -0,0 +1,15 @@
use thiserror::Error;

/// Extraction errors — kept minimal since this crate does no I/O.
/// Most failures come from malformed HTML or invalid URLs.
///
/// The user-facing `Display` text of each variant is the string given in its
/// `#[error(...)]` attribute. The type is cheap to clone and supports equality
/// comparison so callers and tests can match on specific failures.
#[derive(Debug, Clone, PartialEq, Eq, Error)]
pub enum ExtractError {
    /// The HTML input could not be parsed.
    #[error("failed to parse HTML")]
    ParseError,

    /// A URL was rejected as invalid.
    ///
    /// The payload is rendered after `invalid URL: ` in the message.
    /// NOTE(review): presumably the offending URL or a parser diagnostic —
    /// confirm against the call sites that construct this variant.
    #[error("invalid URL: {0}")]
    InvalidUrl(String),

    /// No content was found.
    #[error("no content found")]
    NoContent,
}