test(parity): lock clean JSON prompt transport output

PARITY.md still claimed tool-capable JSON prompt runs leaked human-readable tool result lines, but a local mock SSE reproduction showed stdout already stays transport-clean. Add a real CLI regression test around the binary prompt path and update the parity note so future work does not chase a stale bug report. Constraint: Keep scope limited to JSON prompt parity and leave the existing README Philosophy edits untouched Rejected: Modify claw-cli transport code | current behavior already verified clean via a mock SSE prompt run Confidence: high Scope-risk: narrow Reversibility: clean Directive: Keep prompt JSON stdout parseable as a single transport object even when tool loops fire Tested: cargo test -p claw-cli prompt_json_with_tool_use_writes_clean_transport_output --test prompt_json_transport -- --nocapture Tested: cargo test -p claw-cli parses_bare_prompt_and_json_output_flag -- --nocapture Tested: cargo test -p claw-cli response_to_events_preserves_empty_object_json_input_outside_streaming -- --nocapture Not-tested: Live provider behavior outside the local mock SSE harness
2026-04-05 16:39:04 +08:00 · 2026-04-01 23:15:15 +00:00
parent bcaf6e0771
commit 06ee5a2dc4
2 changed files with 303 additions and 4 deletions
--- a/PARITY.md
+++ b/PARITY.md
@@ -137,7 +137,7 @@ Evidence:
 - Missing major TS command families: `/agents`, `/hooks`, `/mcp`, `/plugin`, `/skills`, `/plan`, `/review`, `/tasks`, and many others.
 - No Rust equivalent to TS structured IO / remote transport layers.
 - No TS-style handler decomposition for auth/plugins/MCP/agents.
- JSON prompt mode is improved on this branch, but still not clean transport parity: empirical verification shows tool-capable JSON output can emit human-readable tool-result lines before the final JSON object.
+- JSON prompt mode now maintains clean transport output in tool-capable runs; the `prompt_json_transport` CLI integration test guards against regressions.

 **Status:** functional local CLI core, much narrower than TS.

@@ -161,7 +161,7 @@ Evidence:
 - No TS-style hook-aware orchestration layer.
 - No TS structured/remote assistant transport stack.
 - No richer TS assistant/session-history/background-task integration.
- JSON output path is no longer single-turn only on this branch, but output cleanliness still lags TS transport expectations.
+- JSON output path is no longer single-turn only on this branch, and tool-capable prompt output now stays transport-clean like the TypeScript behavior.

 **Status:** strong core loop, missing orchestration layers.

@@ -209,6 +209,6 @@ Evidence:
 - **Unlimited max_iterations**
  - Verified at `rust/crates/runtime/src/conversation.rs` with `usize::MAX`.

-### Remaining notable parity issue
+### JSON prompt output cleanliness status
 - **JSON prompt output cleanliness**
-  - Tool-capable JSON mode now loops, but empirical verification still shows pre-JSON human-readable tool-result output when tools fire.
+  - Verified clean in tool-capable prompt mode: stdout remains a single final JSON object when tools fire.
--- a/rust/crates/claw-cli/tests/prompt_json_transport.rs
+++ b/rust/crates/claw-cli/tests/prompt_json_transport.rs
@@ -0,0 +1,299 @@
+use std::fs;
+use std::io::{Read, Write};
+use std::net::TcpListener;
+use std::path::PathBuf;
+use std::process::Command;
+use std::thread;
+use std::time::{Duration, Instant, SystemTime, UNIX_EPOCH};
+
+use serde_json::{json, Value};
+
+/// End-to-end regression test for `--output-format json prompt` when a tool loop fires.
+///
+/// Runs the real `claw` binary against a local mock SSE server that first
+/// answers with a `read_file` tool call and then with the text `done`, and
+/// asserts that stdout is one parseable JSON object with no human-readable
+/// tool rendering mixed in.
+#[test]
+fn prompt_json_with_tool_use_writes_clean_transport_output() {
+    // Scratch workspace: the file the scripted tool call reads, plus a
+    // directory that `CLAW_CONFIG_HOME` is pointed at below.
+    let fixture_root = unique_temp_dir("claw-json-transport");
+    fs::create_dir_all(&fixture_root).expect("create fixture root");
+    fs::write(fixture_root.join("fixture.txt"), "fixture contents\n").expect("write fixture file");
+    fs::create_dir_all(fixture_root.join("config")).expect("create config dir");
+
+    // Two scripted turns: a tool call, then the final text answer.
+    let server = TestServer::spawn(vec![
+        sse_response(
+            "req_tool",
+            &tool_use_stream("read_file", json!({ "path": "fixture.txt" })),
+        ),
+        sse_response("req_done", &text_stream("done")),
+    ]);
+
+    let output = Command::new(env!("CARGO_BIN_EXE_claw"))
+        .current_dir(&fixture_root)
+        .env("ANTHROPIC_BASE_URL", server.base_url())
+        .env("ANTHROPIC_API_KEY", "test-key")
+        .env("CLAW_CONFIG_HOME", fixture_root.join("config"))
+        .arg("--output-format")
+        .arg("json")
+        .arg("prompt")
+        .arg("use a tool")
+        .output()
+        .expect("run claw prompt json");
+
+    let stdout = String::from_utf8(output.stdout).expect("stdout should be utf8");
+    let stderr = String::from_utf8(output.stderr).expect("stderr should be utf8");
+
+    // Check the exit status before joining the server thread. If the CLI died
+    // early, the server's request-count assertion fails as well, and joining
+    // first would report only "join server thread" instead of the CLI's stderr.
+    assert!(
+        output.status.success(),
+        "status: {:?}\nstderr:\n{stderr}",
+        output.status
+    );
+
+    server.finish();
+
+    assert!(stderr.trim().is_empty(), "unexpected stderr: {stderr}");
+    assert!(
+        stdout.trim_start().starts_with('{'),
+        "stdout should begin with JSON object, got:\n{stdout}"
+    );
+
+    let parsed: Value = serde_json::from_str(stdout.trim())
+        .expect("full stdout should be a single parseable JSON object");
+
+    assert_eq!(parsed["message"], "done");
+    assert_eq!(parsed["iterations"], 2);
+    assert_eq!(parsed["tool_uses"].as_array().map(Vec::len), Some(1));
+    assert_eq!(parsed["tool_results"].as_array().map(Vec::len), Some(1));
+    assert_eq!(parsed["tool_uses"][0]["name"], "read_file");
+    assert_eq!(parsed["tool_results"][0]["tool_name"], "read_file");
+    assert_eq!(parsed["tool_results"][0]["is_error"], false);
+
+    let tool_output = parsed["tool_results"][0]["output"]
+        .as_str()
+        .expect("tool result output string");
+    assert!(tool_output.contains("fixture contents"));
+    assert!(
+        !stdout.contains("📄 Read"),
+        "stdout leaked human-readable tool rendering:\n{stdout}"
+    );
+
+    // Best-effort cleanup, reached only when every assertion passed, so a
+    // failing run leaves its fixture directory behind for inspection.
+    let _ = fs::remove_dir_all(&fixture_root);
+}
+
+/// Scripted HTTP server the test points the CLI at via `ANTHROPIC_BASE_URL`.
+///
+/// Holds the address of the bound listener and the background thread that
+/// writes the canned responses.
+struct TestServer {
+    /// `http://<addr>` of the bound loopback listener.
+    base_url: String,
+    /// Thread serving the scripted responses; joined by `finish`.
+    join_handle: thread::JoinHandle<()>,
+}
+
+impl TestServer {
+    /// Starts a background thread that answers one connection per entry of
+    /// `responses`, in order, on an ephemeral `127.0.0.1` port.
+    ///
+    /// The thread polls the non-blocking listener every 10 ms and stops once
+    /// every response has been written or 10 seconds have elapsed. It panics
+    /// if it stops before all responses were served.
+    fn spawn(responses: Vec<String>) -> Self {
+        let listener = TcpListener::bind("127.0.0.1:0").expect("bind listener");
+        listener
+            .set_nonblocking(true)
+            .expect("set nonblocking listener");
+        let address = listener.local_addr().expect("listener addr");
+        let base_url = format!("http://{address}");
+
+        let join_handle = thread::spawn(move || {
+            let started = Instant::now();
+            let budget = Duration::from_secs(10);
+            let mut answered = 0usize;
+
+            loop {
+                // Stop when the script is exhausted or the time budget is spent.
+                if answered >= responses.len() || started.elapsed() >= budget {
+                    break;
+                }
+
+                let (mut connection, _peer) = match listener.accept() {
+                    Ok(accepted) => accepted,
+                    // Nothing is waiting yet: back off briefly and poll again.
+                    Err(error) if error.kind() == std::io::ErrorKind::WouldBlock => {
+                        thread::sleep(Duration::from_millis(10));
+                        continue;
+                    }
+                    Err(error) => panic!("accept failed: {error}"),
+                };
+
+                drain_http_request(&mut connection);
+                connection
+                    .write_all(responses[answered].as_bytes())
+                    .expect("write response");
+                answered += 1;
+            }
+
+            assert_eq!(
+                answered,
+                responses.len(),
+                "server did not observe expected request count"
+            );
+        });
+
+        Self {
+            base_url,
+            join_handle,
+        }
+    }
+
+    /// Returns the `http://<addr>` URL of the listener.
+    fn base_url(&self) -> &str {
+        self.base_url.as_str()
+    }
+
+    /// Waits for the server thread to exit, panicking if that thread panicked.
+    fn finish(self) {
+        let Self { join_handle, .. } = self;
+        join_handle.join().expect("join server thread");
+    }
+}
+
+/// Reads one HTTP request from `stream` and discards it.
+///
+/// Reads until the blank line that terminates the headers, then keeps reading
+/// until `Content-Length` body bytes (0 when the header is absent) have been
+/// consumed or the peer closes the connection.
+///
+/// # Panics
+///
+/// Panics if a socket option cannot be set, a read fails or times out, the
+/// connection closes before the headers end, the headers are not UTF-8, or
+/// `Content-Length` is not a valid number.
+fn drain_http_request(stream: &mut std::net::TcpStream) {
+    // `TestServer::spawn` accepts this stream from a non-blocking listener, and
+    // on some platforms the accepted socket inherits that mode. Force blocking
+    // mode so the reads below wait (bounded by the timeout) instead of failing
+    // with `WouldBlock` when the request bytes have not arrived yet.
+    stream.set_nonblocking(false).expect("set blocking stream");
+    stream
+        .set_read_timeout(Some(Duration::from_secs(5)))
+        .expect("set read timeout");
+
+    // One scratch buffer is reused for both the header and the body reads.
+    let mut chunk = [0_u8; 1024];
+    let mut buffer = Vec::new();
+
+    let header_end = loop {
+        if let Some(position) = find_header_end(&buffer) {
+            break position;
+        }
+        let read = stream.read(&mut chunk).expect("read request chunk");
+        if read == 0 {
+            panic!("request should contain headers");
+        }
+        buffer.extend_from_slice(&chunk[..read]);
+    };
+
+    let headers = std::str::from_utf8(&buffer[..header_end]).expect("header utf8");
+    let content_length = headers
+        .lines()
+        .find_map(|line| {
+            line.split_once(':').and_then(|(name, value)| {
+                name.eq_ignore_ascii_case("content-length")
+                    .then(|| value.trim().parse::<usize>().expect("content length"))
+            })
+        })
+        .unwrap_or(0);
+
+    // Body bytes that arrived in the same reads as the headers (everything
+    // after the 4-byte `\r\n\r\n` terminator) already count as consumed.
+    let mut received = buffer.len() - (header_end + 4);
+    while received < content_length {
+        // Never request more than the declared body still owes.
+        let wanted = (content_length - received).min(chunk.len());
+        let read = stream
+            .read(&mut chunk[..wanted])
+            .expect("read request body");
+        if read == 0 {
+            break;
+        }
+        received += read;
+    }
+}
+
+/// Returns the index of the first `\r\n\r\n` sequence in `buffer`, or `None`
+/// when the buffer does not contain one.
+fn find_header_end(buffer: &[u8]) -> Option<usize> {
+    const TERMINATOR: &[u8] = b"\r\n\r\n";
+    // Only offsets that leave room for the whole terminator are candidates.
+    let candidates = buffer.len().saturating_sub(TERMINATOR.len() - 1);
+    (0..candidates).find(|&start| buffer[start..].starts_with(TERMINATOR))
+}
+
+/// Wraps `body` in a complete `HTTP/1.1 200 OK` response with a
+/// `text/event-stream` content type, the given `request-id` header, a
+/// `Content-Length` equal to the body's byte length, and `Connection: close`.
+fn sse_response(request_id: &str, body: &str) -> String {
+    let content_length = body.len();
+    let head = [
+        String::from("HTTP/1.1 200 OK"),
+        String::from("Content-Type: text/event-stream"),
+        format!("request-id: {request_id}"),
+        format!("Content-Length: {content_length}"),
+        String::from("Connection: close"),
+    ]
+    .join("\r\n");
+
+    // A blank line separates the header section from the body.
+    format!("{head}\r\n\r\n{body}")
+}
+
+/// Builds the SSE body for an assistant turn that makes a single tool call.
+///
+/// The stream opens message `msg_tool`, emits one `tool_use` content block
+/// (`toolu_1`) for `tool_name` whose input arrives as one `input_json_delta`
+/// holding `input` serialized to a string, stops with reason `tool_use`, and
+/// ends with a `data: [DONE]` line.
+fn tool_use_stream(tool_name: &str, input: Value) -> String {
+    let partial_json = input.to_string();
+
+    // Events in wire order; each entry is rendered by `sse_event`.
+    let events = vec![
+        (
+            "message_start",
+            json!({
+                "type": "message_start",
+                "message": {
+                    "id": "msg_tool",
+                    "type": "message",
+                    "role": "assistant",
+                    "content": [],
+                    "model": "claude-opus-4-6",
+                    "stop_reason": null,
+                    "stop_sequence": null,
+                    "usage": {"input_tokens": 8, "output_tokens": 0}
+                }
+            }),
+        ),
+        (
+            "content_block_start",
+            json!({
+                "type": "content_block_start",
+                "index": 0,
+                "content_block": {
+                    "type": "tool_use",
+                    "id": "toolu_1",
+                    "name": tool_name,
+                    "input": {}
+                }
+            }),
+        ),
+        (
+            "content_block_delta",
+            json!({
+                "type": "content_block_delta",
+                "index": 0,
+                "delta": {
+                    "type": "input_json_delta",
+                    "partial_json": partial_json
+                }
+            }),
+        ),
+        (
+            "content_block_stop",
+            json!({"type": "content_block_stop", "index": 0}),
+        ),
+        (
+            "message_delta",
+            json!({
+                "type": "message_delta",
+                "delta": {"stop_reason": "tool_use", "stop_sequence": null},
+                "usage": {"input_tokens": 8, "output_tokens": 1}
+            }),
+        ),
+        ("message_stop", json!({"type": "message_stop"})),
+    ];
+
+    let mut stream: String = events
+        .into_iter()
+        .map(|(event_name, payload)| sse_event(event_name, payload))
+        .collect();
+    stream.push_str("data: [DONE]\n\n");
+    stream
+}
+
+/// Builds the SSE body for an assistant turn that replies with plain text.
+///
+/// The stream opens message `msg_done`, emits one text content block whose
+/// single `text_delta` carries `text`, stops with reason `end_turn`, and ends
+/// with a `data: [DONE]` line.
+fn text_stream(text: &str) -> String {
+    // Events in wire order; each entry is rendered by `sse_event`.
+    let events = vec![
+        (
+            "message_start",
+            json!({
+                "type": "message_start",
+                "message": {
+                    "id": "msg_done",
+                    "type": "message",
+                    "role": "assistant",
+                    "content": [],
+                    "model": "claude-opus-4-6",
+                    "stop_reason": null,
+                    "stop_sequence": null,
+                    "usage": {"input_tokens": 20, "output_tokens": 0}
+                }
+            }),
+        ),
+        (
+            "content_block_start",
+            json!({
+                "type": "content_block_start",
+                "index": 0,
+                "content_block": {"type": "text", "text": ""}
+            }),
+        ),
+        (
+            "content_block_delta",
+            json!({
+                "type": "content_block_delta",
+                "index": 0,
+                "delta": {"type": "text_delta", "text": text}
+            }),
+        ),
+        (
+            "content_block_stop",
+            json!({"type": "content_block_stop", "index": 0}),
+        ),
+        (
+            "message_delta",
+            json!({
+                "type": "message_delta",
+                "delta": {"stop_reason": "end_turn", "stop_sequence": null},
+                "usage": {"input_tokens": 20, "output_tokens": 2}
+            }),
+        ),
+        ("message_stop", json!({"type": "message_stop"})),
+    ];
+
+    let mut stream: String = events
+        .into_iter()
+        .map(|(event_name, payload)| sse_event(event_name, payload))
+        .collect();
+    stream.push_str("data: [DONE]\n\n");
+    stream
+}
+
+/// Renders one server-sent event: an `event:` line with `event_name`, a
+/// `data:` line with `payload` in its `Display` form, and a blank line.
+fn sse_event(event_name: &str, payload: Value) -> String {
+    let data = payload.to_string();
+    // 16 = combined length of the fixed "event: ", "\ndata: " and "\n\n" pieces.
+    let mut frame = String::with_capacity(event_name.len() + data.len() + 16);
+    frame.push_str("event: ");
+    frame.push_str(event_name);
+    frame.push_str("\ndata: ");
+    frame.push_str(&data);
+    frame.push_str("\n\n");
+    frame
+}
+
+/// Returns a path under the system temp directory that has not been handed
+/// out before by this process. The directory itself is not created.
+///
+/// The final component is `{prefix}-{pid}-{nanos}-{sequence}`. The wall-clock
+/// nanosecond value alone can repeat when two callers sample a coarse clock in
+/// the same tick, so the process id separates concurrent test binaries and the
+/// sequence number separates calls within one process.
+///
+/// # Panics
+///
+/// Panics if the system clock reports a time before the Unix epoch.
+fn unique_temp_dir(prefix: &str) -> PathBuf {
+    static SEQUENCE: std::sync::atomic::AtomicUsize = std::sync::atomic::AtomicUsize::new(0);
+
+    let nanos = SystemTime::now()
+        .duration_since(UNIX_EPOCH)
+        .expect("clock should be after epoch")
+        .as_nanos();
+    let pid = std::process::id();
+    let sequence = SEQUENCE.fetch_add(1, std::sync::atomic::Ordering::Relaxed);
+
+    std::env::temp_dir().join(format!("{prefix}-{pid}-{nanos}-{sequence}"))
+}