huskies: merge 1026

This commit is contained in:
dave
2026-05-14 12:53:14 +00:00
parent a80d0a497a
commit 72d79deec9
13 changed files with 1443 additions and 127 deletions
+28 -23
View File
@@ -6,38 +6,27 @@
use crate::http::context::AppContext;
use crate::http::workflow::create_epic_file;
use crate::validation::CreateEpicRequest;
use serde_json::{Value, json};
/// Create a new epic and store it in the CRDT items list.
pub(crate) fn tool_create_epic(args: &Value, ctx: &AppContext) -> Result<String, String> {
let name = args
.get("name")
.and_then(|v| v.as_str())
.ok_or("Missing required argument: name")?;
let goal = args
.get("goal")
.and_then(|v| v.as_str())
.ok_or("Missing required argument: goal")?;
let motivation = args.get("motivation").and_then(|v| v.as_str());
let key_files = args.get("key_files").and_then(|v| v.as_str());
let success_criteria: Option<Vec<String>> = args
.get("success_criteria")
.and_then(|v| v.as_array())
.map(|arr| {
arr.iter()
.filter_map(|v| v.as_str().map(str::to_string))
.collect()
});
let req = CreateEpicRequest::from_json(args)?;
let root = ctx.state.get_project_root()?;
let success_criteria = req.success_criteria_strings();
let epic_id = create_epic_file(
&root,
name,
goal,
motivation,
key_files,
success_criteria.as_deref(),
req.name.as_ref(),
req.goal.as_str(),
req.motivation.as_ref().map(|d| d.as_ref()),
req.key_files.as_deref(),
if success_criteria.is_empty() {
None
} else {
Some(success_criteria.as_slice())
},
)?;
Ok(format!("Created epic: {epic_id}"))
@@ -204,6 +193,22 @@ mod tests {
assert!(result.unwrap_err().contains("goal"));
}
#[test]
fn tool_create_epic_rejects_grammar_token_in_name() {
let tmp = tempfile::tempdir().unwrap();
let ctx = test_ctx(tmp.path());
let result = tool_create_epic(
&json!({"name": "Epic </description> bad", "goal": "some goal"}),
&ctx,
);
assert!(result.is_err());
assert!(
result.unwrap_err().contains("AntiGrammarToken"),
"expected AntiGrammarToken error"
);
}
#[test]
fn tool_list_epics_includes_created_epic() {
let tmp = tempfile::tempdir().unwrap();
+82 -47
View File
@@ -3,55 +3,36 @@
use crate::http::context::AppContext;
use crate::http::workflow::create_story_file;
use crate::slog_warn;
use crate::validation::CreateStoryRequest;
use serde_json::Value;
/// Create a new story in the backlog.
///
/// Deserialises the JSON arguments into a `CreateStoryRequest`, runs the full
/// validation pipeline (field-level newtypes + cross-field garde rules), then
/// delegates to `create_story_file` / `create_item_in_backlog`. All ad-hoc
/// string checks have been removed; `CreateStoryRequest` is now the sole gate.
pub(crate) fn tool_create_story(args: &Value, ctx: &AppContext) -> Result<String, String> {
let name = args
.get("name")
.and_then(|v| v.as_str())
.ok_or("Missing required argument: name")?;
let user_story = args.get("user_story").and_then(|v| v.as_str());
let description = args.get("description").and_then(|v| v.as_str());
let acceptance_criteria: Vec<String> = args
.get("acceptance_criteria")
.and_then(|v| serde_json::from_value(v.clone()).ok())
.ok_or("Missing required argument: acceptance_criteria")?;
if acceptance_criteria.is_empty() {
return Err("acceptance_criteria must contain at least one entry".to_string());
}
const JUNK_AC: &[&str] = &["", "todo", "tbd", "fixme", "xxx", "???"];
let all_junk = acceptance_criteria
.iter()
.all(|ac| JUNK_AC.contains(&ac.trim().to_lowercase().as_str()));
if all_junk {
return Err(
"acceptance_criteria must contain at least one real entry (not just TODO/TBD/FIXME/XXX/???)."
.to_string(),
);
}
let depends_on: Option<Vec<u32>> = args
.get("depends_on")
.and_then(|v| serde_json::from_value(v.clone()).ok());
// Spike 61: write the file only — the filesystem watcher detects the new
// .md file in work/1_backlog/ and auto-commits with a deterministic message.
let commit = false;
let req = CreateStoryRequest::from_json(args)?;
let root = ctx.state.get_project_root()?;
let depends_on_ids = req.depends_on_ids();
let story_id = create_story_file(
&root,
name,
user_story,
description,
&acceptance_criteria,
depends_on.as_deref(),
commit,
req.name.as_ref(),
req.user_story.as_ref().map(|d| d.as_ref()),
req.description.as_ref().map(|d| d.as_ref()),
&req.acceptance_criteria
.iter()
.map(|ac| ac.as_ref().to_string())
.collect::<Vec<_>>(),
depends_on_ids.as_deref(),
false,
)?;
// Bug 503: warn at creation time if any depends_on points at an already-archived story.
// Archived = satisfied semantics: the dep will resolve immediately on the next promotion
// tick, which is surprising if the archived story was abandoned rather than cleanly done.
// Story 929: dep archived-status now comes from the CRDT, not a FS scan of 6_archived/.
let archived_deps: Vec<u32> = depends_on
let archived_deps: Vec<u32> = depends_on_ids
.as_deref()
.map(|deps| {
deps.iter()
@@ -199,7 +180,11 @@ mod tests {
let ctx = test_ctx(tmp.path());
let result = tool_create_story(&json!({}), &ctx);
assert!(result.is_err());
assert!(result.unwrap_err().contains("Missing required argument"));
let err = result.unwrap_err();
assert!(
err.contains("FieldMissing") || err.contains("name"),
"expected FieldMissing/name in: {err}"
);
}
#[test]
@@ -211,7 +196,6 @@ mod tests {
&ctx,
);
assert!(result.is_err());
assert!(result.unwrap_err().contains("alphanumeric"));
}
#[test]
@@ -224,8 +208,8 @@ mod tests {
)
.unwrap_err();
assert!(
err.contains("empty") || err.contains("whitespace"),
"error should mention empty/whitespace, got: {err}"
err.contains("EmptyAfterTrim") || err.contains("empty") || err.contains("whitespace"),
"error should mention EmptyAfterTrim/empty/whitespace, got: {err}"
);
}
@@ -277,10 +261,6 @@ mod tests {
&ctx,
);
assert!(result.is_err());
assert!(
result.unwrap_err().contains("real entry"),
"error should mention real entry"
);
}
#[test]
@@ -326,4 +306,59 @@ mod tests {
"Description text missing from story: {content}"
);
}
#[test]
fn tool_create_story_rejects_grammar_token_in_name() {
let tmp = tempfile::tempdir().unwrap();
let ctx = test_ctx(tmp.path());
let err = tool_create_story(
&json!({
"name": "Bad </description> Story",
"acceptance_criteria": ["AC1"]
}),
&ctx,
)
.unwrap_err();
assert!(
err.contains("AntiGrammarToken") || err.contains("grammar"),
"expected grammar-token error, got: {err}"
);
}
#[test]
fn tool_create_story_rejects_grammar_token_in_ac() {
let tmp = tempfile::tempdir().unwrap();
let ctx = test_ctx(tmp.path());
let err = tool_create_story(
&json!({
"name": "Valid Story",
"acceptance_criteria": ["<thinking>bad output</thinking>"]
}),
&ctx,
)
.unwrap_err();
assert!(
err.contains("AntiGrammarToken") || err.contains("grammar"),
"expected grammar-token error, got: {err}"
);
}
#[test]
fn tool_create_story_html_sanitised_in_name() {
let tmp = tempfile::tempdir().unwrap();
let ctx = test_ctx(tmp.path());
// HTML in name is sanitised (not rejected)
let result = tool_create_story(
&json!({
"name": "Story with <b>bold</b> name",
"acceptance_criteria": ["AC1"]
}),
&ctx,
);
// Should succeed (HTML is sanitised, not rejected)
assert!(
result.is_ok(),
"HTML in name should be sanitised: {result:?}"
);
}
}
+50 -52
View File
@@ -6,11 +6,16 @@
use std::path::Path;
use super::super::{next_item_number, slugify_name, write_story_content};
use super::super::create_item_in_backlog;
/// Create an epic file and store it in the database.
/// Create an epic file, storing it in the database via `create_item_in_backlog`.
///
/// Returns the epic_id (e.g. `"880"`).
/// Routes through `create_item_in_backlog` so that the tombstone-skip allocator
/// defence and post-write CRDT verification (added by bug 1001's fix) apply to
/// epics too. Previously this function had its own ad-hoc allocate-and-write
/// path that bypassed those safety checks.
///
/// Returns the epic_id (numeric only, e.g. `"880"`).
pub fn create_epic_file(
root: &Path,
name: &str,
@@ -19,61 +24,54 @@ pub fn create_epic_file(
key_files: Option<&str>,
success_criteria: Option<&[String]>,
) -> Result<String, String> {
let epic_number = next_item_number(root)?;
let slug = slugify_name(name);
let name_owned = name.to_string();
let goal_owned = goal.to_string();
let motivation_owned = motivation.map(str::to_string);
let key_files_owned = key_files.map(str::to_string);
let success_criteria_owned: Vec<String> =
success_criteria.map(|sc| sc.to_vec()).unwrap_or_default();
if slug.is_empty() {
return Err("Name must contain at least one alphanumeric character.".to_string());
}
// Epics don't have acceptance criteria; pass an empty slice.
// create_item_in_backlog skips the AC check for type "epic".
create_item_in_backlog(root, "epic", name, &[], None, move |epic_number| {
let mut content = String::new();
content.push_str("---\n");
content.push_str("type: epic\n");
content.push_str(&format!("name: \"{}\"\n", name_owned.replace('"', "\\\"")));
content.push_str("---\n\n");
content.push_str(&format!("# Epic {epic_number}: {name_owned}\n\n"));
let epic_id = format!("{epic_number}");
content.push_str("## Goal\n\n");
content.push_str(&goal_owned);
content.push_str("\n\n");
let mut content = String::new();
content.push_str("---\n");
content.push_str("type: epic\n");
content.push_str(&format!("name: \"{}\"\n", name.replace('"', "\\\"")));
content.push_str("---\n\n");
content.push_str(&format!("# Epic {epic_number}: {name}\n\n"));
content.push_str("## Goal\n\n");
content.push_str(goal);
content.push_str("\n\n");
content.push_str("## Motivation\n\n");
if let Some(m) = motivation {
content.push_str(m);
content.push('\n');
} else {
content.push_str("- TBD\n");
}
content.push('\n');
content.push_str("## Key Files\n\n");
if let Some(kf) = key_files {
content.push_str(kf);
content.push('\n');
} else {
content.push_str("- TBD\n");
}
content.push('\n');
content.push_str("## Success Criteria\n\n");
match success_criteria {
Some(criteria) if !criteria.is_empty() => {
for c in criteria {
content.push_str(&format!("- {c}\n"));
}
}
_ => {
content.push_str("## Motivation\n\n");
if let Some(ref m) = motivation_owned {
content.push_str(m);
content.push('\n');
} else {
content.push_str("- TBD\n");
}
}
content.push('\n');
// Epics are stored in backlog (no pipeline advancement).
write_story_content(root, &epic_id, "1_backlog", &content, Some(name));
content.push_str("## Key Files\n\n");
if let Some(ref kf) = key_files_owned {
content.push_str(kf);
content.push('\n');
} else {
content.push_str("- TBD\n");
}
content.push('\n');
// Story 933: typed CRDT register for item_type.
crate::crdt_state::set_item_type(&epic_id, Some(crate::io::story_metadata::ItemType::Epic));
content.push_str("## Success Criteria\n\n");
if !success_criteria_owned.is_empty() {
for c in &success_criteria_owned {
content.push_str(&format!("- {c}\n"));
}
} else {
content.push_str("- TBD\n");
}
Ok(epic_id)
content
})
}
+7 -5
View File
@@ -250,15 +250,17 @@ pub(crate) fn create_item_in_backlog(
if slugify_name(name).is_empty() {
return Err("Title must contain at least one alphanumeric character.".to_string());
}
if acceptance_criteria.is_empty() {
return Err("At least one acceptance criterion is required.".to_string());
}
const VALID_TYPES: &[&str] = &["story", "bug", "spike", "refactor"];
const VALID_TYPES: &[&str] = &["story", "bug", "spike", "refactor", "epic"];
if !VALID_TYPES.contains(&item_type) {
return Err(format!(
"Invalid item type '{item_type}': must be one of story, bug, spike, refactor."
"Invalid item type '{item_type}': must be one of story, bug, spike, refactor, epic."
));
}
// Epics use success_criteria (optional); the acceptance_criteria check is
// only meaningful for pipeline work items.
if item_type != "epic" && acceptance_criteria.is_empty() {
return Err("At least one acceptance criterion is required.".to_string());
}
let item_number = next_item_number(root)?;
let item_id = format!("{item_number}");
+2
View File
@@ -43,6 +43,8 @@ pub mod sled_uplink;
mod startup;
mod state;
mod store;
/// Validated input layer — transport-agnostic newtypes and request structs for all MCP write tools.
pub mod validation;
mod workflow;
mod worktree;
+127
View File
@@ -0,0 +1,127 @@
//! Typed validation error enum returned from all MCP write-tool input validation.
use serde::{Deserialize, Serialize};
use std::fmt;
/// Structured error from input validation.
///
/// Each variant carries exactly the data a caller needs to act on the error.
/// Serialises to serde's default externally-tagged form, e.g.
/// `{"FieldTooLong":{"field":"description","max":200,"actual":287}}`.
/// Callers can pattern-match on the JSON tag without parsing prose.
#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
pub enum ValidationError {
/// A required field was absent from the input.
FieldMissing { field: String },
/// A field value is empty (or whitespace-only) after trimming.
EmptyAfterTrim { field: String },
/// A field value exceeds the maximum allowed length.
FieldTooLong {
field: String,
max: usize,
actual: usize,
},
/// A field value contains a character outside the allowed set.
InvalidCharacter {
field: String,
ch: char,
position: usize,
},
/// A field value contains a tool-call grammar fragment that must be rejected.
AntiGrammarToken { field: String, token: String },
/// A numeric field value is outside its allowed range.
OutOfRange {
field: String,
min: i64,
max: i64,
actual: i64,
},
/// A list field has fewer items than the minimum.
TooFewItems {
field: String,
min: usize,
actual: usize,
},
/// A list field has more items than the maximum.
TooManyItems {
field: String,
max: usize,
actual: usize,
},
/// A field value is not valid UTF-8.
InvalidUtf8 { field: String },
/// A `depends_on` entry references the same item being created or updated.
SelfReference { field: String },
}
impl fmt::Display for ValidationError {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
match self {
Self::FieldMissing { field } => {
write!(f, "field '{field}' is required but was not provided")
}
Self::EmptyAfterTrim { field } => {
write!(f, "field '{field}' must not be empty or whitespace-only")
}
Self::FieldTooLong { field, max, actual } => {
write!(f, "field '{field}' is too long ({actual} chars, max {max})")
}
Self::InvalidCharacter {
field,
ch,
position,
} => {
write!(
f,
"field '{field}' contains invalid character {ch:?} at position {position}"
)
}
Self::AntiGrammarToken { field, token } => {
write!(
f,
"field '{field}' contains a tool-call grammar fragment: {token:?}"
)
}
Self::OutOfRange {
field,
min,
max,
actual,
} => {
write!(
f,
"field '{field}' value {actual} is out of allowed range [{min}, {max}]"
)
}
Self::TooFewItems { field, min, actual } => {
write!(
f,
"field '{field}' has too few items ({actual}; minimum {min})"
)
}
Self::TooManyItems { field, max, actual } => {
write!(
f,
"field '{field}' has too many items ({actual}; maximum {max})"
)
}
Self::InvalidUtf8 { field } => {
write!(f, "field '{field}' contains invalid UTF-8")
}
Self::SelfReference { field } => {
write!(
f,
"field '{field}' contains a self-reference (depends on itself)"
)
}
}
}
}
/// Serialise a slice of validation errors as a pretty-printed JSON string.
///
/// Used to turn `Vec<ValidationError>` into the `Err(String)` value returned by
/// MCP tool handlers.
pub fn format_errors_as_json(errors: &[ValidationError]) -> String {
serde_json::to_string_pretty(errors).unwrap_or_else(|_| format!("{errors:?}"))
}
+22
View File
@@ -0,0 +1,22 @@
//! Transport-agnostic validated input layer for MCP write tools.
//!
//! This module houses all input validation primitives shared across MCP, HTTP,
//! and future WebSocket callers. It is intentionally decoupled from any
//! specific transport — callers parse their raw input into the request types
//! here and receive either a validated struct or a `Vec<ValidationError>`.
//!
//! # Structure
//!
//! - [`error`] — [`ValidationError`] typed enum + JSON serialisation helpers.
//! - [`sanitize`] — HTML sanitisation via `ammonia`.
//! - [`newtypes`] — field-level newtypes (`StoryName`, `AcceptanceCriterion`, …).
//! - [`requests`] — top-level request structs with cross-field `garde` rules.
mod error;
mod newtypes;
mod requests;
mod sanitize;
pub use error::{ValidationError, format_errors_as_json};
pub use newtypes::{AcceptanceCriterion, DependsOnId, Description, StoryName};
pub use requests::{CreateEpicRequest, CreateStoryRequest};
+397
View File
@@ -0,0 +1,397 @@
//! Validated input newtypes for MCP write tools.
//!
//! Each newtype's inner value is guaranteed valid once constructed — the only
//! public constructors run the full validation pipeline. Use the associated
//! `parse` or `parse_with_field` methods (which return rich `Vec<ValidationError>`)
//! in preference to nutype's lower-level `new()`.
use nutype::nutype;
use serde::{Deserialize, Serialize};
use super::error::ValidationError;
use super::sanitize;
/// Tool-call grammar fragments that must be rejected in any text field.
///
/// These are hallucination artifacts from the LLM (bug 1001): if they appear
/// in a field value the whole call is malformed bot output, not user content.
const ANTI_GRAMMAR_TOKENS: &[&str] = &[
"</description>",
"<parameter name=",
"<thinking>",
"</thinking>",
"<assistant>",
"</assistant>",
"<tool_use>",
"</tool_use>",
"<tool_result>",
"</tool_result>",
"<function_calls>",
"</function_calls>",
"<invoke>",
"</invoke>",
];
/// Maximum length (chars) for a story/epic name.
pub(super) const NAME_MAX_LEN: usize = 200;
/// Maximum length (chars) for a description / goal / motivation field.
pub(super) const DESCRIPTION_MAX_LEN: usize = 4000;
/// Maximum length (chars) for a single acceptance criterion.
pub(super) const AC_MAX_LEN: usize = 1000;
/// Scan `value` for any anti-grammar-token and return errors if found.
fn check_grammar_tokens(field: &str, value: &str) -> Vec<ValidationError> {
ANTI_GRAMMAR_TOKENS
.iter()
.filter(|&&token| value.contains(token))
.map(|&token| ValidationError::AntiGrammarToken {
field: field.to_string(),
token: token.to_string(),
})
.collect()
}
// ---------------------------------------------------------------------------
// StoryName newtype
// ---------------------------------------------------------------------------
fn is_story_name_nonempty(val: &str) -> bool {
!val.is_empty()
}
#[nutype(
sanitize(trim),
validate(predicate = is_story_name_nonempty),
derive(Debug, Clone, PartialEq, Serialize, Deserialize, AsRef)
)]
/// A validated, trimmed story or epic name.
pub struct StoryName(String);
impl StoryName {
/// Parse a raw string as a story name, returning all validation errors found.
///
/// Checks anti-grammar tokens first (on the raw trimmed value), then HTML-sanitises,
/// then validates length and non-emptiness.
pub fn parse(raw: &str) -> Result<Self, Vec<ValidationError>> {
let trimmed = raw.trim();
// Anti-grammar check on original trimmed value — must precede HTML sanitise
// because ammonia would strip the tokens before we could detect them.
let grammar_errors = check_grammar_tokens("name", trimmed);
if !grammar_errors.is_empty() {
return Err(grammar_errors);
}
let (sanitized, _) = sanitize::sanitize_html("name", trimmed);
let mut errors = Vec::new();
if sanitized.is_empty() {
errors.push(ValidationError::EmptyAfterTrim {
field: "name".into(),
});
} else if sanitized.len() > NAME_MAX_LEN {
errors.push(ValidationError::FieldTooLong {
field: "name".into(),
max: NAME_MAX_LEN,
actual: sanitized.len(),
});
}
if !errors.is_empty() {
return Err(errors);
}
// nutype's sanitize(trim) is idempotent; predicate passes since we already checked.
StoryName::try_new(sanitized).map_err(|_e| {
vec![ValidationError::EmptyAfterTrim {
field: "name".into(),
}]
})
}
}
// ---------------------------------------------------------------------------
// AcceptanceCriterion newtype
// ---------------------------------------------------------------------------
fn is_ac_nonempty(val: &str) -> bool {
!val.is_empty()
}
#[nutype(
sanitize(trim),
validate(predicate = is_ac_nonempty),
derive(Debug, Clone, PartialEq, Serialize, Deserialize, AsRef)
)]
/// A single validated acceptance criterion.
pub struct AcceptanceCriterion(String);
impl AcceptanceCriterion {
/// Parse a single raw acceptance criterion string, using `field` in error messages.
pub fn parse(field: &str, raw: &str) -> Result<Self, Vec<ValidationError>> {
let trimmed = raw.trim();
let grammar_errors = check_grammar_tokens(field, trimmed);
if !grammar_errors.is_empty() {
return Err(grammar_errors);
}
let (sanitized, _) = sanitize::sanitize_html(field, trimmed);
let mut errors = Vec::new();
if sanitized.is_empty() {
errors.push(ValidationError::EmptyAfterTrim {
field: field.to_string(),
});
} else if sanitized.len() > AC_MAX_LEN {
errors.push(ValidationError::FieldTooLong {
field: field.to_string(),
max: AC_MAX_LEN,
actual: sanitized.len(),
});
}
if !errors.is_empty() {
return Err(errors);
}
AcceptanceCriterion::try_new(sanitized).map_err(|_e| {
vec![ValidationError::EmptyAfterTrim {
field: field.to_string(),
}]
})
}
}
// ---------------------------------------------------------------------------
// Description newtype (used for description, user_story, goal, motivation)
// ---------------------------------------------------------------------------
/// A validated trimmed description / goal / motivation text.
///
/// The field name is not embedded in the type; pass it to `parse`.
#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
pub struct Description(String);
impl Description {
/// Parse and validate a description field value.
///
/// `field` is used in error messages (e.g. `"description"`, `"goal"`).
pub fn parse(field: &str, raw: &str) -> Result<Self, Vec<ValidationError>> {
let trimmed = raw.trim();
let grammar_errors = check_grammar_tokens(field, trimmed);
if !grammar_errors.is_empty() {
return Err(grammar_errors);
}
let (sanitized, _) = sanitize::sanitize_html(field, trimmed);
let mut errors = Vec::new();
if sanitized.is_empty() {
errors.push(ValidationError::EmptyAfterTrim {
field: field.to_string(),
});
} else if sanitized.len() > DESCRIPTION_MAX_LEN {
errors.push(ValidationError::FieldTooLong {
field: field.to_string(),
max: DESCRIPTION_MAX_LEN,
actual: sanitized.len(),
});
}
if !errors.is_empty() {
Err(errors)
} else {
Ok(Description(sanitized))
}
}
/// Return the inner string value.
pub fn as_str(&self) -> &str {
&self.0
}
}
impl AsRef<str> for Description {
fn as_ref(&self) -> &str {
&self.0
}
}
// ---------------------------------------------------------------------------
// DependsOnId newtype
// ---------------------------------------------------------------------------
fn is_nonzero_dep_id(val: &u32) -> bool {
*val != 0
}
#[nutype(
validate(predicate = is_nonzero_dep_id),
derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)
)]
/// A validated non-zero story/item dependency ID.
pub struct DependsOnId(u32);
impl DependsOnId {
/// Parse a raw `u32` as a dependency ID, using `field` in error messages.
pub fn parse(field: &str, id: u32) -> Result<Self, Vec<ValidationError>> {
if id == 0 {
return Err(vec![ValidationError::OutOfRange {
field: field.to_string(),
min: 1,
max: i64::from(u32::MAX),
actual: 0,
}]);
}
DependsOnId::try_new(id).map_err(|_| {
vec![ValidationError::OutOfRange {
field: field.to_string(),
min: 1,
max: i64::from(u32::MAX),
actual: i64::from(id),
}]
})
}
/// Return the raw inner value.
pub fn get(self) -> u32 {
self.into_inner()
}
}
#[cfg(test)]
mod tests {
use super::*;
// --- StoryName ---
#[test]
fn story_name_rejects_empty() {
let err = StoryName::parse("").unwrap_err();
assert!(matches!(err[0], ValidationError::EmptyAfterTrim { .. }));
}
#[test]
fn story_name_rejects_whitespace_only() {
let err = StoryName::parse(" ").unwrap_err();
assert!(matches!(err[0], ValidationError::EmptyAfterTrim { .. }));
}
#[test]
fn story_name_accepts_valid() {
let n = StoryName::parse("My Story").unwrap();
assert_eq!(n.as_ref(), "My Story");
}
#[test]
fn story_name_trims_whitespace() {
let n = StoryName::parse(" Trimmed ").unwrap();
assert_eq!(n.as_ref(), "Trimmed");
}
#[test]
fn story_name_rejects_too_long() {
let long = "x".repeat(NAME_MAX_LEN + 1);
let err = StoryName::parse(&long).unwrap_err();
assert!(matches!(err[0], ValidationError::FieldTooLong { .. }));
}
#[test]
fn story_name_rejects_grammar_token() {
let err = StoryName::parse("my story </description> end").unwrap_err();
assert!(matches!(err[0], ValidationError::AntiGrammarToken { .. }));
}
#[test]
fn story_name_rejects_thinking_token() {
let err = StoryName::parse("<thinking>hello</thinking>").unwrap_err();
assert!(matches!(err[0], ValidationError::AntiGrammarToken { .. }));
}
#[test]
fn story_name_strips_html() {
let n = StoryName::parse("Hello <b>World</b>").unwrap();
assert!(!n.as_ref().contains('<'));
assert!(n.as_ref().contains("World"));
}
// --- AcceptanceCriterion ---
#[test]
fn ac_rejects_empty() {
let err = AcceptanceCriterion::parse("acceptance_criteria[0]", "").unwrap_err();
assert!(matches!(err[0], ValidationError::EmptyAfterTrim { .. }));
}
#[test]
fn ac_accepts_valid() {
let ac = AcceptanceCriterion::parse("acceptance_criteria[0]", "It works").unwrap();
assert_eq!(ac.as_ref(), "It works");
}
#[test]
fn ac_rejects_grammar_token() {
let err = AcceptanceCriterion::parse("acceptance_criteria[0]", "<tool_use>bad</tool_use>")
.unwrap_err();
assert!(matches!(err[0], ValidationError::AntiGrammarToken { .. }));
}
#[test]
fn ac_rejects_too_long() {
let long = "x".repeat(AC_MAX_LEN + 1);
let err = AcceptanceCriterion::parse("acceptance_criteria[0]", &long).unwrap_err();
assert!(matches!(err[0], ValidationError::FieldTooLong { .. }));
}
// --- Description ---
#[test]
fn description_rejects_empty() {
let err = Description::parse("description", "").unwrap_err();
assert!(matches!(err[0], ValidationError::EmptyAfterTrim { .. }));
}
#[test]
fn description_accepts_valid() {
let d = Description::parse("goal", "Achieve world peace").unwrap();
assert_eq!(d.as_str(), "Achieve world peace");
}
#[test]
fn description_rejects_grammar_token() {
let err = Description::parse("description", "text <parameter name=x> more").unwrap_err();
assert!(matches!(err[0], ValidationError::AntiGrammarToken { .. }));
}
// --- DependsOnId ---
#[test]
fn depends_on_id_rejects_zero() {
let err = DependsOnId::parse("depends_on[0]", 0).unwrap_err();
assert!(matches!(err[0], ValidationError::OutOfRange { .. }));
}
#[test]
fn depends_on_id_accepts_nonzero() {
let id = DependsOnId::parse("depends_on[0]", 42).unwrap();
assert_eq!(id.get(), 42);
}
// --- Round-trip serde ---
#[test]
fn validation_error_round_trips_json() {
let err = ValidationError::FieldTooLong {
field: "description".into(),
max: 200,
actual: 287,
};
let json = serde_json::to_string(&err).unwrap();
assert!(json.contains("FieldTooLong"));
assert!(json.contains("description"));
let back: ValidationError = serde_json::from_str(&json).unwrap();
assert_eq!(err, back);
}
}
+476
View File
@@ -0,0 +1,476 @@
//! Validated request structs for MCP write tools.
//!
//! Each struct is populated by `from_json`, which runs field-level validation via
//! the newtypes, then cross-field rules via `garde`. Callers receive either a
//! fully validated struct or a `Vec<ValidationError>` with every problem found.
use garde::Validate;
use serde_json::Value;
use super::error::{ValidationError, format_errors_as_json};
use super::newtypes::{AcceptanceCriterion, DependsOnId, Description, StoryName};
// ---------------------------------------------------------------------------
// Cross-field validators (used by garde derive)
// ---------------------------------------------------------------------------
/// Junk-only acceptance-criteria indicators — placeholders agents fill in but
/// that contain no actionable requirement.
const JUNK_AC_MARKERS: &[&str] = &["todo", "tbd", "fixme", "xxx", "???"];
fn validate_acceptance_criteria_nonempty(acs: &[AcceptanceCriterion], _ctx: &()) -> garde::Result {
if acs.is_empty() {
return Err(garde::Error::new(
"acceptance_criteria must contain at least one entry",
));
}
let all_junk = acs.iter().all(|ac| {
let lower = ac.as_ref().to_lowercase();
JUNK_AC_MARKERS.contains(&lower.trim())
});
if all_junk {
return Err(garde::Error::new(
"acceptance_criteria must contain at least one real entry (not just TODO/TBD/FIXME)",
));
}
Ok(())
}
// ---------------------------------------------------------------------------
// CreateStoryRequest
// ---------------------------------------------------------------------------
/// Fully validated inputs for the `create_story` MCP tool.
#[derive(Debug, Validate)]
pub struct CreateStoryRequest {
/// Validated story name.
#[garde(skip)]
pub name: StoryName,
/// Optional user story text.
#[garde(skip)]
pub user_story: Option<Description>,
/// Optional background description.
#[garde(skip)]
pub description: Option<Description>,
/// At least one non-junk acceptance criterion required (garde-enforced).
#[garde(custom(validate_acceptance_criteria_nonempty))]
pub acceptance_criteria: Vec<AcceptanceCriterion>,
/// Optional list of story IDs this story depends on.
#[garde(skip)]
pub depends_on: Option<Vec<DependsOnId>>,
}
impl CreateStoryRequest {
/// Parse and validate a `create_story` JSON argument map.
///
/// Runs all field-level validation and cross-field garde rules in a single
/// pass. Returns every error found, not just the first.
pub fn from_json(args: &Value) -> Result<Self, String> {
let mut errors: Vec<ValidationError> = Vec::new();
// name (required)
let name = match args.get("name").and_then(|v| v.as_str()) {
None => {
errors.push(ValidationError::FieldMissing {
field: "name".into(),
});
None
}
Some(raw) => match StoryName::parse(raw) {
Ok(n) => Some(n),
Err(mut errs) => {
errors.append(&mut errs);
None
}
},
};
// user_story (optional)
let user_story = match args.get("user_story").and_then(|v| v.as_str()) {
None => None,
Some(raw) => match Description::parse("user_story", raw) {
Ok(d) => Some(d),
Err(mut errs) => {
errors.append(&mut errs);
None
}
},
};
// description (optional)
let description = match args.get("description").and_then(|v| v.as_str()) {
None => None,
Some(raw) => match Description::parse("description", raw) {
Ok(d) => Some(d),
Err(mut errs) => {
errors.append(&mut errs);
None
}
},
};
// acceptance_criteria (required)
let acceptance_criteria = match args
.get("acceptance_criteria")
.and_then(|v| serde_json::from_value::<Vec<String>>(v.clone()).ok())
{
None => {
errors.push(ValidationError::FieldMissing {
field: "acceptance_criteria".into(),
});
None
}
Some(raw_acs) => {
let mut parsed = Vec::new();
for (i, raw) in raw_acs.iter().enumerate() {
let field = format!("acceptance_criteria[{i}]");
match AcceptanceCriterion::parse(&field, raw) {
Ok(ac) => parsed.push(ac),
Err(mut errs) => errors.append(&mut errs),
}
}
Some(parsed)
}
};
// depends_on (optional)
let depends_on: Option<Vec<DependsOnId>> =
match args.get("depends_on").and_then(|v| v.as_array()) {
None => None,
Some(arr) => {
let mut ids = Vec::new();
for (i, val) in arr.iter().enumerate() {
let field = format!("depends_on[{i}]");
match val.as_u64().map(|n| n as u32) {
None => errors.push(ValidationError::InvalidUtf8 {
field: field.clone(),
}),
Some(id) => match DependsOnId::parse(&field, id) {
Ok(d) => ids.push(d),
Err(mut errs) => errors.append(&mut errs),
},
}
}
Some(ids)
}
};
if !errors.is_empty() {
return Err(format_errors_as_json(&errors));
}
let req = CreateStoryRequest {
name: name.unwrap(),
user_story,
description,
acceptance_criteria: acceptance_criteria.unwrap(),
depends_on,
};
// Cross-field garde validation
if let Err(report) = req.validate_with(&()) {
for (_, _field_error) in report.iter() {
// Map garde errors back to typed ValidationError.
// The only garde rule here is the AC nonempty/junk check.
let actual = req.acceptance_criteria.len();
let all_junk = req.acceptance_criteria.iter().all(|ac| {
let lower = ac.as_ref().to_lowercase();
JUNK_AC_MARKERS.contains(&lower.trim())
});
if all_junk && actual > 0 {
errors.push(ValidationError::TooFewItems {
field: "acceptance_criteria".into(),
min: 1,
// Semantic "0 real entries"
actual: 0,
});
} else {
errors.push(ValidationError::TooFewItems {
field: "acceptance_criteria".into(),
min: 1,
actual,
});
}
}
return Err(format_errors_as_json(&errors));
}
Ok(req)
}
/// Extract validated `depends_on` as a plain `Vec<u32>` for downstream use.
pub fn depends_on_ids(&self) -> Option<Vec<u32>> {
self.depends_on
.as_ref()
.map(|ids| ids.iter().map(|d| d.get()).collect())
}
}
// ---------------------------------------------------------------------------
// CreateEpicRequest
// ---------------------------------------------------------------------------
/// Fully validated inputs for the `create_epic` MCP tool.
#[derive(Debug, Validate)]
pub struct CreateEpicRequest {
/// Validated epic name.
#[garde(skip)]
pub name: StoryName,
/// Validated goal statement.
#[garde(skip)]
pub goal: Description,
/// Optional motivation text.
#[garde(skip)]
pub motivation: Option<Description>,
/// Optional key files text (plain string, minimal validation).
#[garde(skip)]
pub key_files: Option<String>,
/// Optional success criteria list.
#[garde(skip)]
pub success_criteria: Option<Vec<AcceptanceCriterion>>,
}
impl CreateEpicRequest {
/// Parse and validate a `create_epic` JSON argument map.
pub fn from_json(args: &Value) -> Result<Self, String> {
let mut errors: Vec<ValidationError> = Vec::new();
// name (required)
let name = match args.get("name").and_then(|v| v.as_str()) {
None => {
errors.push(ValidationError::FieldMissing {
field: "name".into(),
});
None
}
Some(raw) => match StoryName::parse(raw) {
Ok(n) => Some(n),
Err(mut errs) => {
errors.append(&mut errs);
None
}
},
};
// goal (required)
let goal = match args.get("goal").and_then(|v| v.as_str()) {
None => {
errors.push(ValidationError::FieldMissing {
field: "goal".into(),
});
None
}
Some(raw) => match Description::parse("goal", raw) {
Ok(d) => Some(d),
Err(mut errs) => {
errors.append(&mut errs);
None
}
},
};
// motivation (optional)
let motivation = match args.get("motivation").and_then(|v| v.as_str()) {
None => None,
Some(raw) => match Description::parse("motivation", raw) {
Ok(d) => Some(d),
Err(mut errs) => {
errors.append(&mut errs);
None
}
},
};
// key_files (optional, plain string — structural markup, not user prose)
let key_files = args
.get("key_files")
.and_then(|v| v.as_str())
.map(str::trim)
.filter(|s| !s.is_empty())
.map(str::to_string);
// success_criteria (optional list)
let success_criteria = match args
.get("success_criteria")
.and_then(|v| serde_json::from_value::<Vec<String>>(v.clone()).ok())
{
None => None,
Some(raw_sc) => {
let mut parsed = Vec::new();
for (i, raw) in raw_sc.iter().enumerate() {
let field = format!("success_criteria[{i}]");
match AcceptanceCriterion::parse(&field, raw) {
Ok(ac) => parsed.push(ac),
Err(mut errs) => errors.append(&mut errs),
}
}
Some(parsed)
}
};
if !errors.is_empty() {
return Err(format_errors_as_json(&errors));
}
Ok(CreateEpicRequest {
name: name.unwrap(),
goal: goal.unwrap(),
motivation,
key_files,
success_criteria,
})
}
/// Extract success criteria as plain strings for downstream use.
pub fn success_criteria_strings(&self) -> Vec<String> {
self.success_criteria
.as_ref()
.map(|sc| sc.iter().map(|c| c.as_ref().to_string()).collect())
.unwrap_or_default()
}
}
#[cfg(test)]
mod tests {
use super::*;
use serde_json::json;
// --- CreateStoryRequest ---
#[test]
fn create_story_request_valid_minimal() {
let args = json!({
"name": "My Story",
"acceptance_criteria": ["It works"]
});
let req = CreateStoryRequest::from_json(&args).unwrap();
assert_eq!(req.name.as_ref(), "My Story");
assert_eq!(req.acceptance_criteria.len(), 1);
}
#[test]
fn create_story_request_missing_name() {
let args = json!({"acceptance_criteria": ["AC1"]});
let err = CreateStoryRequest::from_json(&args).unwrap_err();
assert!(err.contains("FieldMissing"));
assert!(err.contains("name"));
}
#[test]
fn create_story_request_missing_acs() {
let args = json!({"name": "My Story"});
let err = CreateStoryRequest::from_json(&args).unwrap_err();
assert!(err.contains("FieldMissing"));
assert!(err.contains("acceptance_criteria"));
}
#[test]
fn create_story_request_empty_acs() {
let args = json!({"name": "My Story", "acceptance_criteria": []});
let err = CreateStoryRequest::from_json(&args).unwrap_err();
assert!(err.contains("TooFewItems"));
}
#[test]
fn create_story_request_all_junk_acs() {
let args = json!({"name": "My Story", "acceptance_criteria": ["TODO", "TBD"]});
let err = CreateStoryRequest::from_json(&args).unwrap_err();
assert!(err.contains("TooFewItems"));
}
#[test]
fn create_story_request_mixed_junk_and_real() {
let args = json!({
"name": "My Story",
"acceptance_criteria": ["TODO", "Real criterion"]
});
let req = CreateStoryRequest::from_json(&args).unwrap();
assert_eq!(req.acceptance_criteria.len(), 2);
}
#[test]
fn create_story_request_grammar_token_in_name() {
let args = json!({
"name": "Story </description> bad",
"acceptance_criteria": ["AC1"]
});
let err = CreateStoryRequest::from_json(&args).unwrap_err();
assert!(err.contains("AntiGrammarToken"));
}
#[test]
fn create_story_request_grammar_token_in_ac() {
let args = json!({
"name": "Valid Name",
"acceptance_criteria": ["<thinking>bad</thinking>"]
});
let err = CreateStoryRequest::from_json(&args).unwrap_err();
assert!(err.contains("AntiGrammarToken"));
}
#[test]
fn create_story_request_with_all_optional_fields() {
let args = json!({
"name": "Full Story",
"user_story": "As a user I want this",
"description": "Background context",
"acceptance_criteria": ["AC1", "AC2"],
"depends_on": [1, 2, 3]
});
let req = CreateStoryRequest::from_json(&args).unwrap();
assert_eq!(req.depends_on_ids(), Some(vec![1, 2, 3]));
}
#[test]
fn create_story_request_errors_contain_json() {
let args = json!({
"name": "<thinking>bad</thinking>",
"acceptance_criteria": []
});
let err = CreateStoryRequest::from_json(&args).unwrap_err();
// Errors are JSON, parseable
let parsed: serde_json::Value = serde_json::from_str(&err).unwrap();
assert!(parsed.is_array());
}
// --- CreateEpicRequest ---
#[test]
fn create_epic_request_valid_minimal() {
let args = json!({
"name": "My Epic",
"goal": "Achieve something great"
});
let req = CreateEpicRequest::from_json(&args).unwrap();
assert_eq!(req.name.as_ref(), "My Epic");
assert_eq!(req.goal.as_str(), "Achieve something great");
}
#[test]
fn create_epic_request_missing_name() {
let args = json!({"goal": "some goal"});
let err = CreateEpicRequest::from_json(&args).unwrap_err();
assert!(err.contains("FieldMissing"));
assert!(err.contains("name"));
}
#[test]
fn create_epic_request_missing_goal() {
let args = json!({"name": "Epic"});
let err = CreateEpicRequest::from_json(&args).unwrap_err();
assert!(err.contains("FieldMissing"));
assert!(err.contains("goal"));
}
#[test]
fn create_epic_request_with_success_criteria() {
let args = json!({
"name": "My Epic",
"goal": "Achieve world peace",
"success_criteria": ["All wars end", "People prosper"]
});
let req = CreateEpicRequest::from_json(&args).unwrap();
let sc = req.success_criteria_strings();
assert_eq!(sc.len(), 2);
}
}
+67
View File
@@ -0,0 +1,67 @@
//! HTML sanitisation for user-supplied text fields.
//!
//! Uses ammonia to strip dangerous HTML tags and attributes while preserving
//! the visible text content. Sanitisation that actually fires is logged at
//! WARN so operators can spot abuse patterns.
use sha2::Digest;
use std::collections::HashSet;
/// Sanitise `value` for the named `field`.
///
/// Strips all HTML tags (keeping their text content) and removes dangerous
/// attributes. Returns `(sanitised_value, was_modified)`. When `was_modified`
/// is `true` the caller should log at WARN.
pub(super) fn sanitize_html(field: &str, value: &str) -> (String, bool) {
// Build an ammonia cleaner that allows NO tags but keeps text content.
// clear_content_tags is also set to empty so that <script>...</script>
// content is preserved as literal text rather than silently discarded.
let clean = ammonia::Builder::new()
.tags(HashSet::new())
.clean_content_tags(HashSet::new())
.clean(value)
.to_string();
let modified = clean != value;
if modified {
crate::slog_warn!(
"[validation] HTML sanitised in field '{}': fingerprint={}",
field,
fingerprint(value)
);
}
(clean, modified)
}
/// Return an 8-hex-char SHA-256 fingerprint of the input string.
fn fingerprint(input: &str) -> String {
let hash = sha2::Sha256::digest(input.as_bytes());
hash[..4].iter().map(|b| format!("{b:02x}")).collect()
}
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn script_tags_stripped_content_preserved() {
let (out, modified) = sanitize_html("name", "<script>alert('xss')</script>");
assert!(modified);
assert!(!out.contains("<script>"));
assert!(out.contains("alert("));
}
#[test]
fn plain_text_unchanged() {
let (out, modified) = sanitize_html("name", "Hello World");
assert!(!modified);
assert_eq!(out, "Hello World");
}
#[test]
fn on_event_stripped() {
let (out, modified) = sanitize_html("name", r#"<img onload="evil()">"#);
assert!(modified);
assert!(!out.contains("onload"));
}
}