mirror of
https://github.com/elicpeter/nyx.git
synced 2026-06-06 19:35:13 +02:00
* refactor: Update comments for clarity and add expectations.json files for performance metrics * feat: Implement FP guard for JS/TS local-collection receivers to suppress missing ownership checks * feat: Enhance Rust parameter handling to classify local collections and prevent false ownership checks * refactor: Simplify code formatting for better readability in multiple files * refactor: Improve UTF-8 sequence length handling and enhance clarity in loop iteration * feat: Update Java and Python patterns to include new security rules * refactor: Improve comment clarity and consistency across multiple Rust files * refactor: Simplify code formatting for improved readability in integration tests and module files * refactor: Improve comment formatting and enhance clarity in assertions across multiple files
374 lines
13 KiB
Rust
374 lines
13 KiB
Rust
use crate::labels::{Cap, DataLabel, Kind, LabelRule, ParamConfig, RuntimeLabelRule};
|
|
use crate::utils::project::{DetectedFramework, FrameworkContext};
|
|
use phf::{Map, phf_map};
|
|
|
|
pub static RULES: &[LabelRule] = &[
|
|
// ─────────── Sources ───────────
|
|
LabelRule {
|
|
matchers: &["std::env::var", "env::var", "source_env"],
|
|
label: DataLabel::Source(Cap::all()),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["source_file"],
|
|
label: DataLabel::Source(Cap::all()),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["fs::read_to_string", "fs::read"],
|
|
label: DataLabel::Source(Cap::all()),
|
|
case_sensitive: false,
|
|
},
|
|
// ───────── Sanitizers ──────────
|
|
LabelRule {
|
|
matchers: &["html_escape::encode_safe", "sanitize_", "sanitize_html"],
|
|
label: DataLabel::Sanitizer(Cap::HTML_ESCAPE),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["shell_escape::unix::escape", "sanitize_shell"],
|
|
label: DataLabel::Sanitizer(Cap::SHELL_ESCAPE),
|
|
case_sensitive: false,
|
|
},
|
|
// ─────────── Sinks ─────────────
|
|
LabelRule {
|
|
matchers: &[
|
|
"command::new",
|
|
"std::process::command::new",
|
|
"command::arg",
|
|
"command::args",
|
|
"command::status",
|
|
"command::output",
|
|
],
|
|
label: DataLabel::Sink(Cap::SHELL_ESCAPE),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &["sink_html"],
|
|
label: DataLabel::Sink(Cap::HTML_ESCAPE),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &[
|
|
"fs::read_to_string",
|
|
"fs::write",
|
|
"fs::read",
|
|
"fs::remove_file",
|
|
"fs::remove_dir",
|
|
"fs::remove_dir_all",
|
|
"fs::rename",
|
|
"fs::copy",
|
|
"File::open",
|
|
"File::create",
|
|
],
|
|
label: DataLabel::Sink(Cap::FILE_IO),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &[
|
|
"reqwest::get",
|
|
"reqwest::Client.execute",
|
|
"reqwest::Client.get",
|
|
"reqwest::Client.post",
|
|
"reqwest::Client.put",
|
|
"reqwest::Client.delete",
|
|
"reqwest::Client.head",
|
|
"reqwest::Client.patch",
|
|
"reqwest::Client.request",
|
|
// Type-qualified (receiver typed as HttpClient)
|
|
"HttpClient.get",
|
|
"HttpClient.post",
|
|
"HttpClient.put",
|
|
"HttpClient.delete",
|
|
"HttpClient.head",
|
|
"HttpClient.patch",
|
|
"HttpClient.request",
|
|
"HttpClient.execute",
|
|
"HttpClient.send",
|
|
],
|
|
label: DataLabel::Sink(Cap::SSRF),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &[
|
|
"rusqlite::Connection.execute",
|
|
"rusqlite::Connection.query",
|
|
"rusqlite::Connection.query_row",
|
|
"rusqlite::Connection.prepare",
|
|
"sqlx::query",
|
|
"sqlx::query_as",
|
|
"sqlx::query_scalar",
|
|
"diesel::sql_query",
|
|
"postgres::Client.execute",
|
|
"postgres::Client.query",
|
|
"postgres::Client.prepare",
|
|
// Type-qualified (receiver typed as DatabaseConnection)
|
|
"DatabaseConnection.execute",
|
|
"DatabaseConnection.query",
|
|
"DatabaseConnection.query_row",
|
|
"DatabaseConnection.prepare",
|
|
],
|
|
label: DataLabel::Sink(Cap::SQL_QUERY),
|
|
case_sensitive: false,
|
|
},
|
|
LabelRule {
|
|
matchers: &[
|
|
"serde_yaml::from_str",
|
|
"serde_yaml::from_slice",
|
|
"serde_yaml::from_reader",
|
|
"bincode::deserialize",
|
|
"bincode::deserialize_from",
|
|
"rmp_serde::from_slice",
|
|
"rmp_serde::from_read",
|
|
"ciborium::from_reader",
|
|
"ron::from_str",
|
|
"toml::from_str",
|
|
],
|
|
label: DataLabel::Sink(Cap::DESERIALIZE),
|
|
case_sensitive: false,
|
|
},
|
|
];
|
|
|
|
/// Compile-time lookup table from a syntax-node kind string to the
/// analyzer's [`Kind`] classification.
///
/// Entries are grouped by role: control flow, structural containers,
/// data-flow carriers, struct expressions, and trivia.
pub static KINDS: Map<&'static str, Kind> = phf_map! {
    // ---- control flow ----
    "if_expression" => Kind::If,
    "loop_expression" => Kind::InfiniteLoop,
    "while_statement" => Kind::While,
    "while_expression" => Kind::While,
    "for_statement" => Kind::For,
    "for_expression" => Kind::For,

    "return_statement" => Kind::Return,
    "return_expression" => Kind::Return,
    "break_expression" => Kind::Break,
    "break_statement" => Kind::Break,
    "continue_expression" => Kind::Continue,
    "continue_statement" => Kind::Continue,

    // ---- structure ----
    "source_file" => Kind::SourceFile,
    "block" => Kind::Block,
    "else_clause" => Kind::Block,
    "match_expression" => Kind::Block,
    "match_block" => Kind::Block,
    "match_arm" => Kind::Block,
    "unsafe_block" => Kind::Block,
    "function_item" => Kind::Function,
    "closure_expression" => Kind::Function,
    "async_block" => Kind::Block,
    "impl_item" => Kind::Block,
    "trait_item" => Kind::Block,
    "declaration_list" => Kind::Block,

    // ---- data flow ----
    "call_expression" => Kind::CallFn,
    "method_call_expression" => Kind::CallMethod,
    "macro_invocation" => Kind::CallMacro,
    "let_declaration" => Kind::CallWrapper,
    "expression_statement" => Kind::CallWrapper,
    "assignment_expression" => Kind::Assignment,

    // ---- struct expressions ----
    // These are recursed into so that env::var() calls inside field
    // initialisers produce Source-labelled CFG nodes (needed for summaries).
    "struct_expression" => Kind::Block,
    "field_initializer_list" => Kind::Block,
    "field_initializer" => Kind::CallWrapper,

    // ---- trivia ----
    "line_comment" => Kind::Trivia,
    "block_comment" => Kind::Trivia,
    ";" => Kind::Trivia,
    "," => Kind::Trivia,
    "(" => Kind::Trivia,
    ")" => Kind::Trivia,
    "{" => Kind::Trivia,
    "}" => Kind::Trivia,
    "\n" => Kind::Trivia,
    "use_declaration" => Kind::Trivia,
    "attribute_item" => Kind::Trivia,
    "mod_item" => Kind::Trivia,
    "type_item" => Kind::Trivia,
};
|
|
|
|
/// Parameter-extraction settings for Rust.
///
/// NOTE(review): the field meanings below are inferred from the field names;
/// confirm against the `ParamConfig` definition.
pub static PARAM_CONFIG: ParamConfig = ParamConfig {
    // Field that holds a function's parameter list.
    params_field: "parameters",
    // Node kinds treated as ordinary parameters.
    param_node_kinds: &["parameter"],
    // Node kinds treated as the `self` receiver.
    self_param_kinds: &["self_parameter"],
    // Fields of a parameter node that carry its identifier.
    ident_fields: &["pattern"],
};
|
|
|
|
/// Framework-conditional rules for Rust.
|
|
pub fn framework_rules(ctx: &FrameworkContext) -> Vec<RuntimeLabelRule> {
|
|
let mut rules = Vec::new();
|
|
|
|
if ctx.has(DetectedFramework::Axum) {
|
|
rules.push(RuntimeLabelRule {
|
|
matchers: vec![
|
|
"Path".into(),
|
|
"Query".into(),
|
|
"Json".into(),
|
|
"Form".into(),
|
|
"Multipart".into(),
|
|
"HeaderMap".into(),
|
|
"HeaderMap.get".into(),
|
|
"Request.headers".into(),
|
|
"Request.uri".into(),
|
|
"headers.get".into(),
|
|
],
|
|
label: DataLabel::Source(Cap::all()),
|
|
case_sensitive: true,
|
|
});
|
|
rules.push(RuntimeLabelRule {
|
|
matchers: vec!["Html".into(), "IntoResponse".into()],
|
|
label: DataLabel::Sink(Cap::HTML_ESCAPE),
|
|
case_sensitive: true,
|
|
});
|
|
rules.push(RuntimeLabelRule {
|
|
matchers: vec!["Redirect::to".into()],
|
|
label: DataLabel::Sink(Cap::SSRF),
|
|
case_sensitive: true,
|
|
});
|
|
}
|
|
|
|
if ctx.has(DetectedFramework::ActixWeb) {
|
|
rules.push(RuntimeLabelRule {
|
|
matchers: vec![
|
|
"web::Path".into(),
|
|
"web::Query".into(),
|
|
"web::Json".into(),
|
|
"web::Form".into(),
|
|
"web::Bytes".into(),
|
|
"HttpRequest".into(),
|
|
"HttpRequest.headers".into(),
|
|
"HttpRequest.cookie".into(),
|
|
"HttpRequest.match_info".into(),
|
|
"HttpRequest.query_string".into(),
|
|
],
|
|
label: DataLabel::Source(Cap::all()),
|
|
case_sensitive: true,
|
|
});
|
|
rules.push(RuntimeLabelRule {
|
|
matchers: vec![
|
|
"HttpResponse.body".into(),
|
|
"HttpResponse.json".into(),
|
|
"HttpResponse.content_type".into(),
|
|
"body".into(),
|
|
"json".into(),
|
|
],
|
|
label: DataLabel::Sink(Cap::HTML_ESCAPE),
|
|
case_sensitive: true,
|
|
});
|
|
}
|
|
|
|
if ctx.has(DetectedFramework::Rocket) {
|
|
rules.push(RuntimeLabelRule {
|
|
matchers: vec![
|
|
"Json".into(),
|
|
"Form".into(),
|
|
"LenientForm".into(),
|
|
"TempFile".into(),
|
|
"CookieJar".into(),
|
|
"CookieJar.get".into(),
|
|
"CookieJar.get_private".into(),
|
|
"Request.headers".into(),
|
|
"Request.cookies".into(),
|
|
],
|
|
label: DataLabel::Source(Cap::all()),
|
|
case_sensitive: true,
|
|
});
|
|
rules.push(RuntimeLabelRule {
|
|
matchers: vec!["RawHtml".into(), "content::RawHtml".into(), "Html".into()],
|
|
label: DataLabel::Sink(Cap::HTML_ESCAPE),
|
|
case_sensitive: true,
|
|
});
|
|
rules.push(RuntimeLabelRule {
|
|
matchers: vec!["Redirect::to".into()],
|
|
label: DataLabel::Sink(Cap::SSRF),
|
|
case_sensitive: true,
|
|
});
|
|
}
|
|
|
|
rules
|
|
}
|
|
|
|
/// auth-as-taint label rules for Rust. Gated by
|
|
/// `config.scanner.enable_auth_as_taint`; appended to the runtime rule set
|
|
/// when the flag is enabled. These declare **sinks** (state-changing or
|
|
/// outbound operations that should not be reached by an un-checked
|
|
/// request-bound id) and **sanitizers** (ownership/membership guards that
|
|
/// validate a caller-supplied id).
|
|
pub fn phase_c_auth_rules() -> Vec<RuntimeLabelRule> {
|
|
vec![
|
|
// ── Sinks requiring Cap::UNAUTHORIZED_ID ──
|
|
// Realtime / pub-sub: broadcasting on a caller-supplied group/channel
|
|
// id without first verifying membership is the canonical cross-tenant
|
|
// leak.
|
|
RuntimeLabelRule {
|
|
matchers: vec![
|
|
"realtime::publish".into(),
|
|
"realtime::publish_to_group".into(),
|
|
"realtime::publish_to_channel".into(),
|
|
"realtime::broadcast".into(),
|
|
"broadcaster::send".into(),
|
|
"broadcaster::publish".into(),
|
|
"pubsub::publish".into(),
|
|
],
|
|
label: DataLabel::Sink(Cap::UNAUTHORIZED_ID),
|
|
case_sensitive: false,
|
|
},
|
|
// Database mutations keyed by caller-supplied id. These overlay the
|
|
// existing SQL_QUERY sink declarations (multi-label composition) so
|
|
// a bare id carrying only UNAUTHORIZED_ID still fires.
|
|
RuntimeLabelRule {
|
|
matchers: vec![
|
|
"rusqlite::Connection.execute".into(),
|
|
"postgres::Client.execute".into(),
|
|
"sqlx::query".into(),
|
|
"sqlx::query_as".into(),
|
|
"diesel::insert_into".into(),
|
|
"diesel::update".into(),
|
|
"diesel::delete".into(),
|
|
// Type-qualified (receiver typed as DatabaseConnection)
|
|
"DatabaseConnection.execute".into(),
|
|
"DatabaseConnection.query".into(),
|
|
],
|
|
label: DataLabel::Sink(Cap::UNAUTHORIZED_ID),
|
|
case_sensitive: false,
|
|
},
|
|
// Outbound cache writes.
|
|
RuntimeLabelRule {
|
|
matchers: vec![
|
|
"redis::cmd".into(),
|
|
"cache::set".into(),
|
|
"cache::set_ex".into(),
|
|
"cache::insert".into(),
|
|
],
|
|
label: DataLabel::Sink(Cap::UNAUTHORIZED_ID),
|
|
case_sensitive: false,
|
|
},
|
|
// ── Sanitizers clearing Cap::UNAUTHORIZED_ID ──
|
|
// Ownership and membership guards consumed via call-site
|
|
// argument sanitization (see `is_auth_as_taint_arg_sanitizer`).
|
|
RuntimeLabelRule {
|
|
matchers: vec![
|
|
"check_ownership".into(),
|
|
"has_ownership".into(),
|
|
"require_ownership".into(),
|
|
"ensure_ownership".into(),
|
|
"is_owner".into(),
|
|
"authorize".into(),
|
|
"verify_access".into(),
|
|
"has_permission".into(),
|
|
"can_access".into(),
|
|
"can_manage".into(),
|
|
"require_group_member".into(),
|
|
"require_org_member".into(),
|
|
"require_workspace_member".into(),
|
|
"require_tenant_member".into(),
|
|
"require_team_member".into(),
|
|
"require_membership".into(),
|
|
"check_membership".into(),
|
|
"authz::require".into(),
|
|
"authz::check".into(),
|
|
],
|
|
label: DataLabel::Sanitizer(Cap::UNAUTHORIZED_ID),
|
|
case_sensitive: false,
|
|
},
|
|
]
|
|
}
|