fix: Added additional graph validation for parallel reads and writes with dependencies between nodes states

2026-05-20 17:35:33 -06:00
parent 4536d00067
commit 3c7d19da07
2 changed files with 298 additions and 0 deletions
@@ -353,6 +353,24 @@ fn single_reference_key(template: &str) -> Option<&str> {
    valid.then_some(inner)
 }

+// Returns the root state keys referenced by any `{{...}}` expressions in the
+// given template string. The "root key" is the identifier before the first
+// `.` or `[` — i.e. for `{{user.name}}` the root is `user`, for `{{items[0]}}`
+// the root is `items`. Used by the validator to compute the static read-set of
+// a node's templated fields without depending on a runtime `StateManager`.
+pub(super) fn template_root_keys(template: &str) -> Vec<String> {
+    TEMPLATE_VAR_RE
+        .captures_iter(template)
+        .flatten()
+        .filter_map(|c| c.get(1))
+        .map(|m| {
+            let inner = m.as_str();
+            let cut = inner.find(['.', '[']).unwrap_or(inner.len());
+            inner[..cut].to_string()
+        })
+        .collect()
+}
+
 fn value_to_string(value: &Value) -> String {
    match value {
        Value::String(s) => s.clone(),
@@ -1,3 +1,4 @@
+use super::state::template_root_keys;
 use super::types::{Graph, Node, NodeType};
 use crate::client::{Model, ModelType};
 use crate::config::{Agent, AppConfig, paths};
@@ -122,6 +123,7 @@ impl GraphValidator {
        self.validate_map_branches(graph, &mut result);
        self.validate_parallel_user_interaction(graph, &mut result);
        self.validate_parallel_writes(graph, &mut result);
+        self.validate_parallel_reads(graph, &mut result);

        result
    }
@@ -539,6 +541,51 @@ impl GraphValidator {
            }
        }
    }
+
+    fn validate_parallel_reads(&self, graph: &Graph, result: &mut ValidationResult) {
+        for group in compute_parallel_groups(graph) {
+            let nodes: Vec<(&String, &Node)> = group
+                .iter()
+                .filter_map(|id| graph.nodes.get(id).map(|n| (id, n)))
+                .collect();
+
+            for (id_a, node_a) in &nodes {
+                let read_set_a = read_set_of(node_a);
+                if read_set_a.is_empty() {
+                    continue;
+                }
+                for (id_b, node_b) in &nodes {
+                    if id_b == id_a {
+                        continue;
+                    }
+                    let Some(write_set_b) = write_set_of(node_b) else {
+                        continue;
+                    };
+                    let mut collisions: Vec<String> =
+                        read_set_a.intersection(&write_set_b).cloned().collect();
+                    if collisions.is_empty() {
+                        continue;
+                    }
+                    collisions.sort();
+                    let keys = collisions
+                        .iter()
+                        .map(|k| format!("`{k}`"))
+                        .collect::<Vec<_>>()
+                        .join(", ");
+                    result.error(ValidationError::with_node(
+                        id_a.as_str(),
+                        format!(
+                            "node '{id_a}' reads state key(s) {keys} which sibling parallel \
+                             branch '{id_b}' writes in the same super-step; parallel branches \
+                             see a state snapshot taken BEFORE the super-step and cannot observe \
+                             each other's writes. Move the dependent read to a later super-step \
+                             (or remove the cross-branch reference)."
+                        ),
+                    ));
+                }
+            }
+        }
+    }
 }

 fn declared_targets(node: &Node) -> Vec<(String, &'static str)> {
@@ -646,6 +693,103 @@ fn write_set_of(node: &Node) -> Option<HashSet<String>> {
    Some(writes)
 }

+// Computes the set of root state keys this node's templated fields read from.
+//
+// "Root key" follows the same definition as `template_root_keys`: for a
+// reference like `{{user.name}}` or `{{items[0]}}`, the root is the bare
+// identifier before the first `.` or `[`.
+//
+// Templated fields scanned per node type:
+//   - llm:      instructions, prompt, state_updates values
+//   - agent:    prompt, state_updates values
+//   - rag:      query (defaulting to "{{initial_prompt}}"), state_updates values
+//   - approval: question, state_updates values
+//   - input:    question, default, state_updates values
+//   - end:      output, state_updates values
+//   - map:      over (its `{{...}}` IS the dynamic read of the list to fan out over)
+//   - script:   state_updates values only (the script body is opaque to static
+//               analysis; its reads via GRAPH_STATE / GRAPH_STATE_FILE can't be
+//               inferred at load time)
+//
+// Scoped variables produced by THIS node's own execution are excluded from
+// state_updates value scanning:
+//   - llm/agent/rag → "output" (the node's body output)
+//   - approval      → "choice" (the user's selected option)
+//   - input         → "input"  (the user's typed text)
+// These are bindings created inside the node, not reads from prior state, so
+// they cannot race with a sibling's writes.
+fn read_set_of(node: &Node) -> HashSet<String> {
+    let mut reads: HashSet<String> = HashSet::new();
+    let scoped: &[&str] = match &node.node_type {
+        NodeType::Llm(_) | NodeType::Agent(_) | NodeType::Rag(_) => &["output"],
+        NodeType::Approval(_) => &["choice"],
+        NodeType::Input(_) => &["input"],
+        NodeType::Script(_) | NodeType::End(_) | NodeType::Map(_) => &[],
+    };
+
+    for s in primary_templated_fields(node) {
+        for k in template_root_keys(&s) {
+            reads.insert(k);
+        }
+    }
+
+    if let Some(updates) = node_state_updates_map(node) {
+        for v in updates.values() {
+            for k in template_root_keys(v) {
+                if !scoped.contains(&k.as_str()) {
+                    reads.insert(k);
+                }
+            }
+        }
+    }
+
+    reads
+}
+
+fn primary_templated_fields(node: &Node) -> Vec<String> {
+    match &node.node_type {
+        NodeType::Llm(n) => {
+            let mut v = vec![n.prompt.clone()];
+            if let Some(i) = &n.instructions {
+                v.push(i.clone());
+            }
+            v
+        }
+        NodeType::Agent(n) => vec![n.prompt.clone()],
+        NodeType::Rag(n) => {
+            vec![
+                n.query
+                    .clone()
+                    .unwrap_or_else(|| "{{initial_prompt}}".to_string()),
+            ]
+        }
+        NodeType::Approval(n) => vec![n.question.clone()],
+        NodeType::Input(n) => {
+            let mut v = vec![n.question.clone()];
+            if let Some(d) = &n.default {
+                v.push(d.clone());
+            }
+            v
+        }
+        NodeType::End(n) => vec![n.output.clone()],
+        NodeType::Map(n) => vec![n.over.clone()],
+        NodeType::Script(_) => Vec::new(),
+    }
+}
+
+fn node_state_updates_map(node: &Node) -> Option<&std::collections::HashMap<String, String>> {
+    match &node.node_type {
+        NodeType::Llm(n) => n.state_updates.as_ref(),
+        NodeType::Agent(n) => n.state_updates.as_ref(),
+        NodeType::Rag(n) => n.state_updates.as_ref(),
+        NodeType::Approval(n) => n.state_updates.as_ref(),
+        NodeType::Input(n) => n.state_updates.as_ref(),
+        NodeType::Script(n) => n.state_updates.as_ref(),
+        NodeType::End(n) => n.state_updates.as_ref(),
+        NodeType::Map(_) => None,
+    }
+}
+
 fn node_state_updates_keys(node: &Node) -> Option<HashSet<String>> {
    let updates = match &node.node_type {
        NodeType::Agent(n) => n.state_updates.as_ref(),
@@ -2064,4 +2208,140 @@ mod tests {
            result.errors
        );
    }
+
+    fn llm_with_prompt(id: &str, prompt: &str, next: Option<&str>) -> Node {
+        let mut node = llm_node(id, None, next);
+        if let NodeType::Llm(ref mut n) = node.node_type {
+            n.prompt = prompt.into();
+        }
+        node
+    }
+
+    #[test]
+    fn parallel_read_of_sibling_write_errors() {
+        let reader = llm_with_prompt("worker_a", "Hello {{summary}}!", Some("end"));
+        let writer = llm_with_state_updates("worker_b", &[("summary", "static")], Some("end"));
+        let graph = fan_out_graph_with_two_workers(reader, writer);
+
+        let result = validator().validate(&graph);
+
+        assert!(
+            result
+                .errors
+                .iter()
+                .any(|e| e.message.contains("reads state key(s) `summary`")
+                    && e.message.contains("'worker_b'")),
+            "expected cross-branch read error mentioning `summary` and sibling writer: {:?}",
+            result.errors
+        );
+    }
+
+    #[test]
+    fn parallel_read_of_upstream_key_passes() {
+        let reader_a = llm_with_prompt("worker_a", "Topic is {{topic}}", Some("end"));
+        let reader_b = llm_with_prompt("worker_b", "Also {{topic}}", Some("end"));
+        let graph = fan_out_graph_with_two_workers(reader_a, reader_b);
+
+        let result = validator().validate(&graph);
+
+        assert!(
+            !result
+                .errors
+                .iter()
+                .any(|e| e.message.contains("reads state key")),
+            "upstream `topic` shouldn't trigger cross-branch read error: {:?}",
+            result.errors
+        );
+    }
+
+    #[test]
+    fn scoped_output_var_in_state_updates_not_treated_as_read() {
+        let scoped_user =
+            llm_with_state_updates("worker_a", &[("a_key", "{{output}}")], Some("end"));
+        let writes_output =
+            llm_with_state_updates("worker_b", &[("output", "{{output}}")], Some("end"));
+        let graph = fan_out_graph_with_two_workers(scoped_user, writes_output);
+
+        let result = validator().validate(&graph);
+
+        assert!(
+            !result
+                .errors
+                .iter()
+                .any(|e| e.message.contains("reads state key(s) `output`")
+                    && e.message.contains("worker_a")),
+            "scoped `{{{{output}}}}` inside state_updates value should NOT be treated as a read: {:?}",
+            result.errors
+        );
+    }
+
+    #[test]
+    fn rag_query_reading_sibling_script_write_errors() {
+        let mut rag = rag_node("worker_a", &["./k"], true);
+        if let NodeType::Rag(ref mut n) = rag.node_type {
+            n.query = Some("codes: {{loinc_codes}}\n{{db_result}}".into());
+            if let Some(m) = n.state_updates.as_mut() {
+                m.insert("rag_ctx".into(), "{{output.context}}".into());
+            }
+        }
+        rag.next = Some("end".into());
+        let mut script = script_with_state_updates("worker_b", &[("db_result", "{{output}}")]);
+        script.next = Some("end".into());
+        let graph = fan_out_graph_with_two_workers(rag, script);
+
+        let result = validator().validate(&graph);
+
+        assert!(
+            result
+                .errors
+                .iter()
+                .any(|e| e.message.contains("reads state key(s) `db_result`")
+                    && e.message.contains("'worker_b'")),
+            "expected cross-branch read error for rag query reading db_result: {:?}",
+            result.errors
+        );
+    }
+
+    #[test]
+    fn map_over_reading_sibling_write_errors() {
+        let map_n = Node {
+            id: "fan".into(),
+            description: String::new(),
+            node_type: NodeType::Map(MapNode {
+                over: "{{items}}".into(),
+                as_name: "item".into(),
+                branch: "branch_n".into(),
+                output_key: "output".into(),
+                collect_into: "results".into(),
+                max_concurrency: None,
+            }),
+            next: Some("end".into()),
+        };
+        let branch_n = llm_with_prompt("branch_n", "Process {{item}}", None);
+        let producer = llm_with_state_updates("producer", &[("items", "[1,2,3]")], Some("end"));
+        let mut start = end_node("start");
+        start.next = Some(NextTargets::Many(vec!["fan".into(), "producer".into()]));
+        let graph = graph_with(
+            vec![
+                ("start", start),
+                ("fan", map_n),
+                ("branch_n", branch_n),
+                ("producer", producer),
+                ("end", end_node("end")),
+            ],
+            "start",
+        );
+
+        let result = validator().validate(&graph);
+
+        assert!(
+            result
+                .errors
+                .iter()
+                .any(|e| e.message.contains("reads state key(s) `items`")
+                    && e.message.contains("'producer'")),
+            "expected cross-branch read error for map `over` reading sibling write: {:?}",
+            result.errors
+        );
+    }
 }