# Package metadata for the `noxa-core` crate.
# `version`, `edition`, and `license` are inherited from the workspace
# manifest's `[workspace.package]` table rather than being set here.
[package]
name = "noxa-core"
version.workspace = true
edition.workspace = true
license.workspace = true
description = "Pure HTML content extraction engine for LLMs"

# Cargo features.
# `quickjs` is enabled by default; build with `--no-default-features`
# to leave it (and the optional `rquickjs` dependency it activates) out.
[features]
default = ["quickjs"]
# Turns on the optional `rquickjs` dependency declared under [dependencies].
quickjs = ["rquickjs"]

# Runtime dependencies, sorted alphabetically.
# Entries written as `{ workspace = true }` take their version (and any
# shared settings) from the workspace manifest's `[workspace.dependencies]`.
[dependencies]
ego-tree = "0.10"
once_cell = "1"
regex = "1"
# Optional: only compiled when the `quickjs` feature is enabled.
rquickjs = { version = "0.9", features = ["classes", "properties"], optional = true }
scraper = "0.22"
serde = { workspace = true }
serde_json = { workspace = true }
similar = "2"
thiserror = { workspace = true }
tracing = { workspace = true }
url = { version = "2", features = ["serde"] }

# Dependencies used only when building tests, examples, and benchmarks.
[dev-dependencies]
tokio = { workspace = true }