mirror of
https://github.com/elicpeter/nyx.git
synced 2026-06-09 19:45:13 +02:00
* feat: Enhance data exfiltration detection with source sensitivity gating for cookies and headers * feat: Implement cross-file data exfiltration detection with parameter-specific gate filters * feat: Add calibration tests and refine DATA_EXFIL severity scoring logic * feat: Introduce per-detector configuration for data exfiltration suppression * feat: Enhance DATA_EXFIL findings with destination field tracking in diagnostics and SARIF output * feat: Add tainted body and URL handling for data exfiltration detection * feat: Add integration tests and fixtures for DATA_EXFIL and SSRF detection in Go * feat: Add Java integration tests and fixtures for DATA_EXFIL detection across multiple HTTP clients * feat: Add synthetic externals handling for closure-captured variables in SSA * feat: Implement closure-based suppression for resource leak findings * feat: Add regression guards for shell-injection and taint propagation in for-of destructure patterns * feat: Implement constructor cap narrowing for data exfiltration detection in HTTP request builders * feat: Add gated sinks for data exfiltration detection in C and C++ using curl_easy_setopt * feat: Implement DATA_EXFIL cap parity for backwards analysis and add integration tests * feat: Add data exfiltration sinks for various languages and enhance documentation * refactor: Simplify formatting and improve readability in various files * refactor: Improve readability by simplifying conditional statements and adding clippy linting * docs: Update CHANGELOG and comments for data exfiltration features and configuration * docs: Clarify configuration instructions for data exfiltration trusted destinations * docs: Enhance comments for evidence routing logic in data exfiltration
282 lines
10 KiB
Rust
282 lines
10 KiB
Rust
use crate::labels::{
|
|
Cap, DataLabel, GateActivation, Kind, LabelRule, ParamConfig, RuntimeLabelRule, SinkGate,
|
|
};
|
|
use crate::utils::project::{DetectedFramework, FrameworkContext};
|
|
use phf::{Map, phf_map};
|
|
|
|
pub static RULES: &[LabelRule] = &[
|
|
// ─────────── Sources ───────────
|
|
// Note: PHP `$` prefix is stripped by collect_idents, so match without `$`.
|
|
LabelRule {
|
|
matchers: &[
|
|
"$_GET",
|
|
"_GET",
|
|
"$_POST",
|
|
"_POST",
|
|
"$_REQUEST",
|
|
"_REQUEST",
|
|
"$_COOKIE",
|
|
"_COOKIE",
|
|
"$_FILES",
|
|
"_FILES",
|
|
"$_SERVER",
|
|
"_SERVER",
|
|
"$_ENV",
|
|
"_ENV",
|
|
],
|
|
label: DataLabel::Source(Cap::all()),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["file_get_contents", "fread"],
|
|
label: DataLabel::Source(Cap::all()),
|
|
case_sensitive: false,
|
|
},
|
|
// ───────── Sanitizers ──────────
|
|
LabelRule {
|
|
matchers: &["htmlspecialchars", "htmlentities"],
|
|
label: DataLabel::Sanitizer(Cap::HTML_ESCAPE),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["escapeshellarg", "escapeshellcmd"],
|
|
label: DataLabel::Sanitizer(Cap::SHELL_ESCAPE),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["basename", "realpath"],
|
|
label: DataLabel::Sanitizer(Cap::FILE_IO),
|
|
case_sensitive: false,
|
|
},
|
|
// PDO parameterized queries
|
|
LabelRule {
|
|
matchers: &["prepare", "bindParam", "bindValue"],
|
|
label: DataLabel::Sanitizer(Cap::SQL_QUERY),
|
|
case_sensitive: false,
|
|
},
|
|
// Type-check sanitizers
|
|
LabelRule {
|
|
matchers: &["intval", "floatval", "ctype_digit", "ctype_alpha"],
|
|
label: DataLabel::Sanitizer(Cap::all()),
|
|
case_sensitive: false,
|
|
},
|
|
// PHP input filtering
|
|
LabelRule {
|
|
matchers: &["filter_input", "filter_var"],
|
|
label: DataLabel::Sanitizer(Cap::all()),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["urlencode", "rawurlencode"],
|
|
label: DataLabel::Sanitizer(Cap::URL_ENCODE),
|
|
case_sensitive: false,
|
|
},
|
|
// ─────────── Sinks ─────────────
|
|
LabelRule {
|
|
matchers: &[
|
|
"system",
|
|
"exec",
|
|
"passthru",
|
|
"shell_exec",
|
|
"proc_open",
|
|
"popen",
|
|
],
|
|
label: DataLabel::Sink(Cap::SHELL_ESCAPE),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["eval", "assert"],
|
|
label: DataLabel::Sink(Cap::CODE_EXEC),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["include", "include_once", "require", "require_once"],
|
|
label: DataLabel::Sink(Cap::FILE_IO),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["unserialize"],
|
|
label: DataLabel::Sink(Cap::DESERIALIZE),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["move_uploaded_file", "copy", "file_put_contents", "fwrite"],
|
|
label: DataLabel::Sink(Cap::FILE_IO),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["echo", "print"],
|
|
label: DataLabel::Sink(Cap::HTML_ESCAPE),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["mysqli_query", "pg_query", "pg_execute", "query"],
|
|
label: DataLabel::Sink(Cap::SQL_QUERY),
|
|
case_sensitive: false,
|
|
},
|
|
// PDO and MySQLi OOP: exec/prepare+execute patterns.
|
|
LabelRule {
|
|
matchers: &[
|
|
"pdo.exec",
|
|
"pdo.query",
|
|
"mysqli.real_query",
|
|
"mysqli_real_query",
|
|
],
|
|
label: DataLabel::Sink(Cap::SQL_QUERY),
|
|
case_sensitive: false,
|
|
},
|
|
// Laravel Eloquent: raw SQL methods.
|
|
// DB::raw() → scoped_call_expression, callee text "DB.raw".
|
|
// whereRaw/selectRaw/orderByRaw/havingRaw → member_call_expression on query builder.
|
|
LabelRule {
|
|
matchers: &["DB.raw", "whereRaw", "selectRaw", "orderByRaw", "havingRaw"],
|
|
label: DataLabel::Sink(Cap::SQL_QUERY),
|
|
case_sensitive: false,
|
|
},
|
|
// NOTE: `file_get_contents` can fetch URLs (SSRF vector) and local files (LFI vector).
|
|
// As a Sink(SSRF) it only fires when the argument is tainted.
|
|
LabelRule {
|
|
matchers: &["file_get_contents", "curl_exec"],
|
|
label: DataLabel::Sink(Cap::SSRF),
|
|
case_sensitive: false,
|
|
},
|
|
// ── Cross-boundary data exfiltration ──────────────────────────────────
|
|
//
|
|
// Body-bearing outbound HTTP verb methods on the major PHP HTTP clients.
|
|
// Flat sinks here compose with the SSRF rule on `curl_exec` /
|
|
// `file_get_contents` via multi-label classification. The
|
|
// source-sensitivity gate in `effective_sink_caps` strips DATA_EXFIL
|
|
// when the contributing source is `Plain` (`$_GET`, `$_POST`, `$_REQUEST`),
|
|
// so this only fires for sensitive sources (cookies / sessions /
|
|
// server-side state / env / file / db reads).
|
|
//
|
|
// Covered clients:
|
|
// * `Guzzle\Client::post/put/patch` — guzzlehttp/guzzle
|
|
// matched by suffix on the verb method (chained `$client->post(...)`).
|
|
// * `Symfony\HttpClient::request` — symfony/http-client
|
|
// request($method, $url, ['body' => $payload, 'json' => $data, ...])
|
|
// * `Http::post` — Laravel HTTP facade (over Guzzle)
|
|
LabelRule {
|
|
matchers: &[
|
|
"Client.post",
|
|
"Client.put",
|
|
"Client.patch",
|
|
"Client.request",
|
|
"HttpClient.post",
|
|
"HttpClient.put",
|
|
"HttpClient.patch",
|
|
"HttpClient.request",
|
|
"Http.post",
|
|
"Http.put",
|
|
"Http.patch",
|
|
],
|
|
label: DataLabel::Sink(Cap::DATA_EXFIL),
|
|
case_sensitive: true,
|
|
},
|
|
];
|
|
|
|
/// Gated sinks for PHP.
|
|
///
|
|
/// `curl_setopt($ch, CURLOPT_POSTFIELDS, $payload)` is the canonical
|
|
/// non-OO PHP HTTP-egress payload binding. The activation arg (index 1) is
|
|
/// a `define`d constant: `CURLOPT_POSTFIELDS` (and the byref-copying variant
|
|
/// `CURLOPT_COPYPOSTFIELDS`) carry the request body, while other CURLOPT_*
|
|
/// constants designate URL / auth / TLS / behaviour, none of which is
|
|
/// DATA_EXFIL-relevant. Gating on the constant identifier keeps the rule
|
|
/// from over-firing on `curl_setopt($ch, CURLOPT_URL, $url)` (covered
|
|
/// elsewhere by the `curl_exec` SSRF flat sink).
|
|
///
|
|
/// Identifier-based activation is enabled via the macro-arg fallback in
|
|
/// `cfg::mod::classify_gated_sink` for `lang == "php"`.
|
|
pub static GATED_SINKS: &[SinkGate] = &[SinkGate {
|
|
callee_matcher: "curl_setopt",
|
|
arg_index: 1,
|
|
dangerous_values: &["CURLOPT_POSTFIELDS", "CURLOPT_COPYPOSTFIELDS"],
|
|
dangerous_prefixes: &[],
|
|
label: DataLabel::Sink(Cap::DATA_EXFIL),
|
|
case_sensitive: true,
|
|
payload_args: &[2],
|
|
keyword_name: None,
|
|
dangerous_kwargs: &[],
|
|
activation: GateActivation::ValueMatch,
|
|
}];
|
|
|
|
/// Lookup table from PHP syntax-node kind names to [`Kind`] variants.
///
/// Keys are unique, so the order of entries carries no meaning; they are
/// grouped by role purely for readability.
pub static KINDS: Map<&'static str, Kind> = phf_map! {
    // ---- control flow: branches and loops ----
    "if_statement" => Kind::If,
    "for_statement" => Kind::For,
    "foreach_statement" => Kind::For,
    "while_statement" => Kind::While,
    "do_statement" => Kind::While,

    // ---- control flow: jumps ----
    "return_statement" => Kind::Return,
    "throw_expression" => Kind::Throw,
    "break_statement" => Kind::Break,
    "continue_statement" => Kind::Continue,

    // ---- structure: file root and callables ----
    "program" => Kind::SourceFile,
    "function_definition" => Kind::Function,
    "method_declaration" => Kind::Function,
    "anonymous_function_creation_expression" => Kind::Function,
    "arrow_function" => Kind::Function,

    // ---- structure: switch / try heads ----
    "switch_statement" => Kind::Switch,
    "try_statement" => Kind::Try,

    // ---- structure: everything mapped to a plain block ----
    "compound_statement" => Kind::Block,
    "colon_block" => Kind::Block,
    "else_clause" => Kind::Block,
    "else_if_clause" => Kind::Block,
    "switch_block" => Kind::Block,
    "case_statement" => Kind::Block,
    "default_statement" => Kind::Block,
    "catch_clause" => Kind::Block,
    "finally_clause" => Kind::Block,
    "class_declaration" => Kind::Block,

    // ---- data flow: calls ----
    "function_call_expression" => Kind::CallFn,
    "object_creation_expression" => Kind::CallFn,
    "member_call_expression" => Kind::CallMethod,
    "scoped_call_expression" => Kind::CallMethod,

    // ---- data flow: assignment and call-wrapping statements ----
    "assignment_expression" => Kind::Assignment,
    "expression_statement" => Kind::CallWrapper,
    "echo_statement" => Kind::CallWrapper,

    // ---- trivia: comments, punctuation, tags, namespace plumbing ----
    "comment" => Kind::Trivia,
    ";" => Kind::Trivia,
    "," => Kind::Trivia,
    "(" => Kind::Trivia,
    ")" => Kind::Trivia,
    "{" => Kind::Trivia,
    "}" => Kind::Trivia,
    "\n" => Kind::Trivia,
    "php_tag" => Kind::Trivia,
    "namespace_definition" => Kind::Trivia,
    "namespace_use_declaration" => Kind::Trivia,
};
|
|
|
|
/// Describes where PHP function parameters are found in the syntax tree.
pub static PARAM_CONFIG: ParamConfig = ParamConfig {
    // Field on the function node that holds the parameter list.
    params_field: "parameters",
    // Node kinds counted as a parameter.
    param_node_kinds: &["simple_parameter", "variadic_parameter"],
    // Field on a parameter node that holds its identifier.
    ident_fields: &["name"],
    // No self-parameter node kinds are listed for PHP.
    self_param_kinds: &[],
};
|
|
|
|
/// Framework-conditional rules for PHP.
|
|
pub fn framework_rules(ctx: &FrameworkContext) -> Vec<RuntimeLabelRule> {
|
|
let mut rules = Vec::new();
|
|
|
|
if ctx.has(DetectedFramework::Laravel) {
|
|
rules.push(RuntimeLabelRule {
|
|
matchers: vec![
|
|
"Request::input".into(),
|
|
"Request::get".into(),
|
|
"Request::query".into(),
|
|
"Request::post".into(),
|
|
"Request::all".into(),
|
|
],
|
|
label: DataLabel::Source(Cap::all()),
|
|
case_sensitive: false,
|
|
});
|
|
}
|
|
|
|
rules
|
|
}
|