[pitboss] phase 04: Track J.2 + Track L.2 — SSTI corpus + Jinja2 / ERB / Twig / Thymeleaf / Handlebars adapters

This commit is contained in:
pitboss 2026-05-17 18:51:13 -05:00
parent b5e6dddf2c
commit 8583b29796
34 changed files with 1868 additions and 29 deletions

View file

@ -0,0 +1,16 @@
// Phase 04 (Track J.2) — Java Thymeleaf benign control fixture.
//
// Renders a fixed template that interpolates the body as a model
// variable; the user-controlled value never reaches the template
// compiler.
import org.thymeleaf.TemplateEngine;
import org.thymeleaf.context.Context;
/**
 * Benign control: renders a hard-coded inline template and passes the
 * caller's text in only as the {@code safeBody} context variable.
 */
public class Benign {
/**
 * Processes the literal template {@code [[${safeBody}]]} with {@code body}
 * bound to {@code safeBody}.
 *
 * @param body caller-supplied text; stored in the context, never used as
 *             the template string
 * @return the string returned by {@code TemplateEngine.process}
 */
public static String run(String body) {
TemplateEngine engine = new TemplateEngine();
Context ctx = new Context();
// The caller's text enters only as a named variable in the context.
ctx.setVariable("safeBody", body);
// The template argument is a string literal, so it does not depend on body.
return engine.process("[[${safeBody}]]", ctx);
}
}

View file

@ -0,0 +1,14 @@
// Phase 04 (Track J.2) — Java Thymeleaf SSTI vuln fixture.
//
// The body reaches TemplateEngine.process directly, so an attacker
// who controls the body can render arbitrary Thymeleaf expressions.
import org.thymeleaf.TemplateEngine;
import org.thymeleaf.context.Context;
/**
 * Intentionally vulnerable fixture: the caller's text is itself the template
 * handed to the engine.
 */
public class Vuln {
/**
 * Processes {@code body} as the template with an empty context.
 *
 * @param body caller-supplied text, passed unmodified as the first argument
 *             of {@code TemplateEngine.process}
 * @return the string returned by {@code TemplateEngine.process}
 */
public static String run(String body) {
TemplateEngine engine = new TemplateEngine();
// No variables are set on the context before processing.
Context ctx = new Context();
// Deliberate sink: body is the template argument, not a context variable.
return engine.process(body, ctx);
}
}

View file

@ -0,0 +1,14 @@
// Phase 04 (Track J.2) — JavaScript Handlebars benign control fixture.
//
// Renders a fixed template that interpolates the body as a context
// variable; the user-controlled value never reaches the template
// compiler.
const Handlebars = require('handlebars');
// Compiled once at module load from a hard-coded template string.
const template = Handlebars.compile('{{safeBody}}');
/**
 * Benign control entry point: renders the pre-compiled fixed template with
 * `body` supplied as the `safeBody` context value.
 *
 * @param {*} body Caller-supplied value; passed as context data only and
 *   never handed to `Handlebars.compile`.
 * @returns {*} Whatever the compiled template function returns.
 */
function run(body) {
return template({ safeBody: body });
}
// `run` is the module's only export.
module.exports = { run };

View file

@ -0,0 +1,17 @@
// Phase 04 (Track J.2) — JavaScript Handlebars SSTI vuln fixture.
//
// The body is handed straight to Handlebars.compile so an attacker
// who controls the body reaches the template compiler and can render
// arbitrary helper calls.
const Handlebars = require('handlebars');
// Registers a `multiply` helper that coerces both arguments with `Number`
// and returns their product.
Handlebars.registerHelper('multiply', function (a, b) {
return Number(a) * Number(b);
});
/**
 * Intentionally vulnerable entry point: compiles `body` itself as the
 * template and renders it with an empty context object.
 *
 * @param {*} body Caller-supplied value, passed unmodified to
 *   `Handlebars.compile`.
 * @returns {*} Whatever the compiled template function returns.
 */
function run(body) {
// Deliberate sink: body is the template source, not context data.
const template = Handlebars.compile(body);
return template({});
}
// `run` is the module's only export.
module.exports = { run };

View file

@ -0,0 +1,14 @@
<?php
// Phase 04 (Track J.2) — PHP Twig benign control fixture.
//
// Renders a fixed template that interpolates the user value as a
// variable; the body never reaches the template compiler.
use Twig\Environment;
use Twig\Loader\ArrayLoader;
/**
 * Benign control entry point: renders the fixed 'page' template with $body
 * passed as the 'safe_body' variable.
 *
 * @param string $body Caller-supplied text; passed as render data only.
 * @return string The string returned by Environment::render.
 */
function run(string $body): string {
// The loader holds a single template whose source is a hard-coded literal.
$twig = new Environment(new ArrayLoader([
'page' => '{{ safe_body }}',
]));
// $body appears only in the variables array, never as template source.
return $twig->render('page', ['safe_body' => $body]);
}

View file

@ -0,0 +1,14 @@
<?php
// Phase 04 (Track J.2) — PHP Twig SSTI vuln fixture.
//
// The body is handed straight to Twig\Environment::createTemplate so
// an attacker who controls the body reaches Twig's expression
// evaluator and can render arbitrary expressions.
use Twig\Environment;
use Twig\Loader\ArrayLoader;
/**
 * Intentionally vulnerable entry point: turns $body itself into a template
 * and renders it with no variables.
 *
 * @param string $body Caller-supplied text, passed unmodified to
 *                     Environment::createTemplate.
 * @return string The string returned by the template's render call.
 */
function run(string $body): string {
// The loader is created with an empty template array.
$twig = new Environment(new ArrayLoader([]));
// Deliberate sink: $body is the template source.
$template = $twig->createTemplate($body);
return $template->render([]);
}

View file

@ -0,0 +1,13 @@
"""Phase 04 (Track J.2) — Python Jinja2 benign control fixture.
The function replaces the braces in the body with HTML entities and
passes the result as a variable to a fixed Jinja2 template; the
user-controlled value is never used as template source, so even an
SSTI-shaped payload cannot reach the evaluator.
"""
from jinja2 import Template
# Benign control entry point: renders a fixed template with the
# brace-escaped body supplied as the `safe_body` variable.
def run(body: str) -> str:
# Replace every "{" and "}" with its HTML numeric entity before rendering.
safe = body.replace("{", "&#123;").replace("}", "&#125;")
# The template source is a string literal; `safe` is passed only as data.
template = Template("{{ safe_body | safe }}")
return template.render(safe_body=safe)

View file

@ -0,0 +1,13 @@
"""Phase 04 (Track J.2) — Python Jinja2 SSTI vuln fixture.
The function pulls a template body off the request and pipes it
straight into `jinja2.Template(...).render()` without sandboxing or
expression filtering, so an attacker who controls the body reaches the
expression evaluator and can render arbitrary expressions.
"""
from jinja2 import Template
# Intentionally vulnerable entry point: the caller-supplied body is compiled
# as the template itself.
def run(body: str) -> str:
# Deliberate sink: body is the template source, not a render variable.
template = Template(body)
# render() is called with no variables.
return template.render()

View file

@ -0,0 +1,11 @@
# Phase 04 (Track J.2) — Ruby ERB benign control fixture.
#
# Escapes ERB markers in the body before rendering through a fixed
# template that interpolates only the sanitised value, so SSTI-shaped
# input cannot reach the evaluator.
require 'erb'
# Benign control entry point: rewrites the ERB delimiters in +body+, then
# renders a fixed template that outputs the rewritten string.
def run(body)
# "<%" becomes "&lt;%" and "%>" becomes "%&gt;".
safe_body = body.gsub(/<%/, '&lt;%').gsub(/%>/, '%&gt;')
# The template text is a literal; safe_body is read through the local binding.
ERB.new('<%= safe_body %>').result(binding)
end

View file

@ -0,0 +1,9 @@
# Phase 04 (Track J.2) — Ruby ERB SSTI vuln fixture.
#
# The body is handed straight to ERB.new(...).result so an attacker
# who controls the body reaches the Ruby expression evaluator.
require 'erb'
# Intentionally vulnerable entry point: compiles +body+ itself as the ERB
# template and returns the rendered result.
def run(body)
# Deliberate sink: body is the template source, not data for a fixed template.
ERB.new(body).result
end

300
tests/ssti_corpus.rs Normal file
View file

@ -0,0 +1,300 @@
//! Phase 04 (Track J.2) — SSTI corpus acceptance.
//!
//! Asserts the new cap end-to-end: corpus slices register per-engine
//! vuln/benign pairs (Python/Jinja2, Ruby/ERB, PHP/Twig, Java/Thymeleaf,
//! JS/Handlebars), the lang-aware resolver pairs them inside the
//! correct slice, the per-language harness emitters splice in the
//! synthetic template renderer + sink-hit sentinel, and the
//! framework adapters fire on the canonical sink call.
//!
//! `cargo nextest run --features dynamic --test ssti_corpus`.
#![cfg(feature = "dynamic")]
use nyx_scanner::dynamic::corpus::{
audit_marker_collisions, benign_payload_for_lang, payloads_for_lang,
resolve_benign_control_lang, Oracle,
};
use nyx_scanner::dynamic::framework::registry::adapters_for;
use nyx_scanner::dynamic::lang;
use nyx_scanner::dynamic::oracle::{oracle_fired, ProbePredicate};
use nyx_scanner::dynamic::sandbox::SandboxOutcome;
use nyx_scanner::dynamic::spec::{EntryKind, HarnessSpec, PayloadSlot};
use nyx_scanner::labels::Cap;
use nyx_scanner::summary::FuncSummary;
use nyx_scanner::symbol::Lang;
use std::time::Duration;
/// Languages whose SSTI corpus slice is exercised by the per-language tests
/// in this file; each such test iterates over this list.
const LANGS: &[Lang] = &[
Lang::Python,
Lang::Ruby,
Lang::Php,
Lang::Java,
Lang::JavaScript,
];
/// Builds the [`HarnessSpec`] used by the emitter test in this file.
///
/// Only `lang`, `entry_file` and `entry_name` vary between callers.
/// `entry_file` doubles as the sink file, and every remaining field is a
/// fixed placeholder (SSTI cap, first-parameter payload slot, no framework).
fn make_spec(lang: Lang, entry_file: &str, entry_name: &str) -> HarnessSpec {
    use nyx_scanner::dynamic::spec::SpecDerivationStrategy;

    // One placeholder value serves as both the finding id and the spec hash.
    let placeholder_id = "phase04test0001";

    HarnessSpec {
        lang,
        expected_cap: Cap::SSTI,
        framework: None,
        // Entry point under test.
        entry_file: entry_file.into(),
        entry_name: entry_name.into(),
        entry_kind: EntryKind::Function,
        payload_slot: PayloadSlot::Param(0),
        // The sink is reported in the same file as the entry point.
        sink_file: entry_file.into(),
        sink_line: 1,
        // Identification and provenance placeholders.
        finding_id: placeholder_id.into(),
        spec_hash: placeholder_id.into(),
        toolchain_id: "phase04".into(),
        derivation: SpecDerivationStrategy::FromFlowSteps,
        constraint_hints: Vec::new(),
        stubs_required: Vec::new(),
    }
}
/// Every language in `LANGS` must register a non-empty SSTI slice holding at
/// least one vulnerable payload and at least one benign control.
#[test]
fn corpus_registers_ssti_for_every_supported_lang() {
    for &lang in LANGS {
        let payloads = payloads_for_lang(Cap::SSTI, lang);
        assert!(!payloads.is_empty(), "SSTI has no payloads for {lang:?}");

        // Both scans are evaluated before either assertion runs.
        let (vuln_present, benign_present) = (
            payloads.iter().any(|payload| !payload.is_benign),
            payloads.iter().any(|payload| payload.is_benign),
        );
        assert!(vuln_present, "{lang:?} SSTI missing vuln payload");
        assert!(benign_present, "{lang:?} SSTI missing benign control");
    }
}
/// Languages outside the Phase 04 set must still have no SSTI payloads.
#[test]
fn ssti_unsupported_caps_unchanged_for_other_langs() {
    // Phase 04 only fills Python/Ruby/PHP/Java/JS; the languages listed here
    // are expected to stay empty.
    const UNTOUCHED: [Lang; 5] = [Lang::Rust, Lang::C, Lang::Cpp, Lang::Go, Lang::TypeScript];

    for lang in UNTOUCHED {
        let payloads = payloads_for_lang(Cap::SSTI, lang);
        assert!(
            payloads.is_empty(),
            "unexpected SSTI payloads registered for {lang:?}",
        );
    }
}
/// The lang-aware resolver must pair each language's vuln payload with a
/// benign control whose label matches the one `benign_payload_for_lang`
/// returns directly.
#[test]
fn benign_control_resolves_within_lang_slice() {
    for &lang in LANGS {
        let slice = payloads_for_lang(Cap::SSTI, lang);
        // This runs once per language, so name the language on failure
        // instead of panicking with a bare `unwrap` message.
        let vuln = slice
            .iter()
            .find(|p| !p.is_benign)
            .unwrap_or_else(|| panic!("{lang:?} SSTI slice has no vuln payload"));
        let resolved =
            resolve_benign_control_lang(vuln, Cap::SSTI, lang).expect("paired control");
        assert!(
            resolved.is_benign,
            "{lang:?} resolved control is not marked benign",
        );
        let direct = benign_payload_for_lang(Cap::SSTI, lang)
            .expect("a benign SSTI control must be registered for every language in LANGS");
        assert_eq!(
            direct.label, resolved.label,
            "{lang:?} resolved control label differs from the direct lookup",
        );
    }
}
/// Each language's vuln payload must use a `SinkProbe` oracle that contains
/// `TemplateEvalEqual { expected: 49 }`.
#[test]
fn payload_oracle_carries_template_eval_predicate() {
    for &lang in LANGS {
        let slice = payloads_for_lang(Cap::SSTI, lang);
        // This runs once per language, so name the language on failure
        // instead of panicking with a bare `unwrap` message.
        let vuln = slice
            .iter()
            .find(|p| !p.is_benign)
            .unwrap_or_else(|| panic!("{lang:?} SSTI slice has no vuln payload"));
        match &vuln.oracle {
            Oracle::SinkProbe { predicates } => {
                let has_predicate = predicates
                    .iter()
                    .any(|p| matches!(p, ProbePredicate::TemplateEvalEqual { expected: 49 }));
                assert!(
                    has_predicate,
                    "{lang:?} vuln payload missing TemplateEvalEqual{{expected:49}}",
                );
            }
            other => panic!("expected SinkProbe oracle for {lang:?}, got {other:?}"),
        }
    }
}
/// The marker-collision audit must report nothing.
#[test]
fn marker_collisions_clean_with_phase_04_additions() {
    let collisions = audit_marker_collisions();
    assert!(collisions.is_empty());
}
/// A sink-hit run whose JSON body reports `render` as `"49"` must satisfy
/// `TemplateEvalEqual { expected: 49 }`.
#[test]
fn template_eval_equal_fires_on_render_49_json() {
    // Harness stdout: the sink-hit sentinel line, then the JSON body that the
    // oracle parses.
    let stdout = br#"__NYX_SINK_HIT__
{"render":"49"}
"#
    .to_vec();

    let outcome = SandboxOutcome {
        stdout,
        stderr: Vec::new(),
        exit_code: Some(0),
        sink_hit: true,
        timed_out: false,
        oob_callback_seen: false,
        hardening_outcome: None,
        duration: Duration::from_millis(1),
    };
    let oracle = Oracle::SinkProbe {
        predicates: &[ProbePredicate::TemplateEvalEqual { expected: 49 }],
    };

    assert!(oracle_fired(&oracle, &outcome, &[]));
}
/// A run that merely echoes the literal `7*7` must not satisfy
/// `TemplateEvalEqual { expected: 49 }`.
#[test]
fn template_eval_equal_does_not_fire_on_echo_render() {
    // The benign payload comes back unevaluated, so the rendered value does
    // not parse as an integer and the predicate stays unsatisfied.
    let stdout = br#"__NYX_SINK_HIT__
{"render":"7*7"}
"#
    .to_vec();

    let outcome = SandboxOutcome {
        stdout,
        stderr: Vec::new(),
        exit_code: Some(0),
        sink_hit: true,
        timed_out: false,
        oob_callback_seen: false,
        hardening_outcome: None,
        duration: Duration::from_millis(1),
    };
    let oracle = Oracle::SinkProbe {
        predicates: &[ProbePredicate::TemplateEvalEqual { expected: 49 }],
    };

    assert!(!oracle_fired(&oracle, &outcome, &[]));
}
/// For each supported language, the emitted harness source must contain the
/// language's renderer marker, the sink-hit sentinel and the `render` field
/// name.
#[test]
fn lang_emitter_dispatches_to_ssti_harness() {
    // (language, vuln fixture path, entry function, renderer marker)
    let cases = [
        (
            Lang::Python,
            "tests/dynamic_fixtures/ssti/python_jinja2/vuln.py",
            "run",
            "_nyx_jinja2_render",
        ),
        (
            Lang::Ruby,
            "tests/dynamic_fixtures/ssti/ruby_erb/vuln.rb",
            "run",
            "_nyx_erb_render",
        ),
        (
            Lang::Php,
            "tests/dynamic_fixtures/ssti/php_twig/vuln.php",
            "run",
            "_nyx_twig_render",
        ),
        (
            Lang::Java,
            "tests/dynamic_fixtures/ssti/java_thymeleaf/vuln.java",
            "run",
            "nyxThymeleafRender",
        ),
        (
            Lang::JavaScript,
            "tests/dynamic_fixtures/ssti/js_handlebars/vuln.js",
            "run",
            "nyxHandlebarsRender",
        ),
    ];

    for (lang, entry_file, entry_name, marker) in cases {
        let spec = make_spec(lang, entry_file, entry_name);
        let harness = match lang::emit(&spec) {
            Ok(harness) => harness,
            Err(e) => panic!("emit failed for {lang:?}: {e:?}"),
        };
        let source = &harness.source;

        assert!(
            source.contains(marker),
            "{lang:?} ssti harness must splice {marker:?}",
        );
        assert!(
            source.contains("__NYX_SINK_HIT__"),
            "{lang:?} ssti harness must emit the sink-hit sentinel",
        );
        // NOTE(review): the three snake_case markers above already contain
        // the substring "render", so for those languages this check is
        // implied by the marker assertion.
        assert!(
            source.contains("render"),
            "{lang:?} ssti harness must print the render JSON field",
        );
    }
}
/// For each supported language, the framework registry must be non-empty and
/// `detect_binding` must return an `EntryKind::Function` binding with a
/// non-empty adapter name for the vuln fixture.
#[test]
fn framework_adapters_detect_ssti_sink() {
    use nyx_scanner::dynamic::framework::detect_binding;
    use nyx_scanner::summary::CalleeSite;

    // (language, vuln fixture, canonical sink callee). The callee is seeded
    // into the summary so the callee-side matcher fires alongside the
    // source-side check.
    let cases = [
        (Lang::Python, "tests/dynamic_fixtures/ssti/python_jinja2/vuln.py", "Template"),
        (Lang::Ruby, "tests/dynamic_fixtures/ssti/ruby_erb/vuln.rb", "new"),
        (Lang::Php, "tests/dynamic_fixtures/ssti/php_twig/vuln.php", "createTemplate"),
        (Lang::Java, "tests/dynamic_fixtures/ssti/java_thymeleaf/vuln.java", "process"),
        (Lang::JavaScript, "tests/dynamic_fixtures/ssti/js_handlebars/vuln.js", "compile"),
    ];

    for (lang, fixture, sink_callee) in cases {
        // Parse the fixture with the grammar that matches its language.
        let bytes = std::fs::read(fixture).expect("fixture exists");
        let mut parser = tree_sitter::Parser::new();
        parser.set_language(&ts_language_for(lang)).unwrap();
        let tree = parser.parse(&bytes, None).unwrap();

        // Minimal summary for the fixture's `run` function.
        let mut summary = FuncSummary {
            name: "run".into(),
            file_path: String::from(fixture),
            lang: slug(lang).into(),
            ..Default::default()
        };
        summary.callees.push(CalleeSite::bare(sink_callee));

        assert!(
            !adapters_for(lang).is_empty(),
            "{lang:?} adapter slice empty",
        );

        let found = match detect_binding(&summary, tree.root_node(), &bytes, lang) {
            Some(found) => found,
            None => panic!("{lang:?} adapter must detect the SSTI fixture"),
        };
        assert_eq!(found.kind, EntryKind::Function);
        assert!(!found.adapter.is_empty());
    }
}
/// Returns the tree-sitter grammar for one of the five languages covered by
/// this test file.
///
/// # Panics
///
/// Panics for any other `Lang` variant.
fn ts_language_for(lang: Lang) -> tree_sitter::Language {
    match lang {
        Lang::JavaScript => tree_sitter_javascript::LANGUAGE.into(),
        Lang::Java => tree_sitter_java::LANGUAGE.into(),
        Lang::Php => tree_sitter_php::LANGUAGE_PHP.into(),
        Lang::Ruby => tree_sitter_ruby::LANGUAGE.into(),
        Lang::Python => tree_sitter_python::LANGUAGE.into(),
        other => panic!("unsupported test lang {other:?}"),
    }
}
/// Maps a language to the lowercase name stored in `FuncSummary::lang` by
/// the adapter test; any variant not listed maps to `"other"`.
fn slug(lang: Lang) -> &'static str {
    match lang {
        Lang::JavaScript => "javascript",
        Lang::Java => "java",
        Lang::Php => "php",
        Lang::Ruby => "ruby",
        Lang::Python => "python",
        // Fallback for every language outside the tested set.
        _ => "other",
    }
}