fix(chat): harden bridge_save/agentic_resume against empty and corrupt state
Neuron Soul CI / build (pull_request) Failing after 8m44s

BLOCKER 1: use untyped reassignment (let x = ...) for the fallback bindings
in agentic_resume instead of re-declaring typed let bindings (let x: Type = ...)
for the same variable in the same scope. The typed form risks shadowing semantics
that differ from the established pattern used everywhere else in the loop
(e.g. agentic_loop line 720).

BLOCKER 2: add empty-string guards in both bridge_save and agentic_resume.
bridge_save now returns false without writing state if messages or tools_json
is empty — preventing syntactically invalid JSON blobs. agentic_resume now
returns an error envelope after the fallback resolution if either field is
still empty, rather than passing empty strings into agentic_loop which would
silently start a fresh turn with no context.

Also add tests:
- test_bridge_serialization.el: covers bridge_save empty-guard, golden-path
  raw-JSON round-trip, agentic_resume unknown/corrupt/missing-fields paths,
  and legacy string-escaped fallback path
- test_sessions_routes.el: covers DELETE and PATCH /api/sessions/:id routes
  (valid args, unknown id, empty body) and GET /api/sessions regression after
  removal of the duplicate route_sessions() handler
This commit is contained in:
2026-06-17 12:59:13 -05:00
parent 644d9915bf
commit 459a9cbff2
3 changed files with 442 additions and 2 deletions
+14 -2
View File
@@ -766,6 +766,12 @@ fn agentic_loop(session_id: String, model: String, safe_sys: String, tools_json:
// stored `messages` already includes the assistant turn that requested the tool, so
// resume just appends the client's tool_result for `tool_use_id`.
fn bridge_save(session_id: String, model: String, safe_sys: String, tools_json: String, messages: String, tools_log: String, tool_use_id: String) -> Bool {
// Guard: empty messages or tools_json would produce syntactically invalid JSON.
// Return false so the caller detects the failure rather than writing a corrupt
// blob that agentic_resume would later resume with no context.
if str_eq(messages, "") || str_eq(tools_json, "") {
return false
}
// messages and tools_json are already well-formed JSON arrays; embed them as raw
// JSON values (not string-escaped) so the round-trip through state_get/json_get_raw
// never corrupts nested quotes. Scalar strings (model, safe_sys, tools_log,
@@ -796,9 +802,15 @@ fn agentic_resume(session_id: String, tool_use_id: String, content: String) -> S
// messages_raw and tools_raw are embedded as raw JSON (not string-escaped);
// fall back to legacy string-escaped fields for sessions saved before this fix.
let messages: String = json_get_raw(blob, "messages_raw")
let messages: String = if str_eq(messages, "") { json_get(blob, "messages") } else { messages }
let messages = if str_eq(messages, "") { json_get(blob, "messages") } else { messages }
let tools_json: String = json_get_raw(blob, "tools_raw")
let tools_json: String = if str_eq(tools_json, "") { json_get(blob, "tools_json") } else { tools_json }
let tools_json = if str_eq(tools_json, "") { json_get(blob, "tools_json") } else { tools_json }
// Guard: a corrupt or missing bridge blob (e.g. state cleared mid-flight)
// yields empty messages/tools. Return an error envelope rather than resuming
// with no context, which would cause the model to start a fresh turn.
if str_eq(messages, "") || str_eq(tools_json, "") {
return "{\"error\":\"corrupt bridge state\",\"reply\":\"\"}"
}
let tools_log: String = json_get(blob, "tools_log")
let saved_use_id: String = json_get(blob, "tool_use_id")
+257
View File
@@ -0,0 +1,257 @@
// test_bridge_serialization.el
//
// Tests for PR #20 fix/bridge-save-serialization:
// - bridge_save raw JSON serialization (BLOCKER 1 & 2 regression guards)
// - agentic_resume error-path handling
// - Legacy fallback: old string-escaped fields still readable
// - Corrupt/missing bridge state error envelope
// - Empty messages/tools_json guard in bridge_save
//
// What CANNOT be tested here without a live Anthropic API:
// - agentic_resume golden-path (calls agentic_loop which hits the API)
// - Full save/resume round-trip with a real tool_result
//
// To run:
// elc chat.el && ./soul --test tests/test_bridge_serialization.el
//
//
import "../chat.el"
// Test harness
let pass_count: Int = 0
let fail_count: Int = 0
fn assert_eq(label: String, got: String, expected: String) -> Void {
if str_eq(got, expected) {
let pass_count = pass_count + 1
println(" PASS: " + label)
} else {
let fail_count = fail_count + 1
println(" FAIL: " + label)
println(" got: " + got)
println(" expected: " + expected)
}
}
fn assert_true(label: String, cond: Bool) -> Void {
if cond {
let pass_count = pass_count + 1
println(" PASS: " + label)
} else {
let fail_count = fail_count + 1
println(" FAIL: " + label)
}
}
fn assert_false(label: String, cond: Bool) -> Void {
assert_true(label, !cond)
}
fn assert_contains(label: String, haystack: String, needle: String) -> Void {
if str_contains(haystack, needle) {
let pass_count = pass_count + 1
println(" PASS: " + label)
} else {
let fail_count = fail_count + 1
println(" FAIL: " + label)
println(" missing '" + needle + "' in: " + haystack)
}
}
fn assert_not_contains(label: String, haystack: String, needle: String) -> Void {
if str_contains(haystack, needle) {
let fail_count = fail_count + 1
println(" FAIL: " + label)
println(" unexpected '" + needle + "' found in: " + haystack)
} else {
let pass_count = pass_count + 1
println(" PASS: " + label)
}
}
fn assert_not_empty(label: String, s: String) -> Void {
if str_eq(s, "") {
let fail_count = fail_count + 1
println(" FAIL: " + label + " (got empty string)")
} else {
let pass_count = pass_count + 1
println(" PASS: " + label)
}
}
// Section 1: bridge_save empty messages guard
//
// BLOCKER 2 regression guard: bridge_save must refuse to write a blob when
// messages or tools_json is empty, as the resulting JSON would be syntactically
// invalid (bare colon with no value).
println("")
println("1. bridge_save — empty messages guard")
let sid1: String = "test-session-empty-messages"
state_set("mcp_bridge:" + sid1, "")
let save1_ok: Bool = bridge_save(sid1, "claude-sonnet-4-5", "sys", "[]", "", "", "call-1")
assert_false("empty messages -> bridge_save returns false", save1_ok)
let saved1: String = state_get("mcp_bridge:" + sid1)
assert_eq("empty messages -> no blob written to state", saved1, "")
// Section 2: bridge_save empty tools_json guard
println("")
println("2. bridge_save — empty tools_json guard")
let sid2: String = "test-session-empty-tools"
state_set("mcp_bridge:" + sid2, "")
let save2_ok: Bool = bridge_save(sid2, "claude-sonnet-4-5", "sys", "", "[{\"role\":\"user\",\"content\":\"hi\"}]", "", "call-2")
assert_false("empty tools_json -> bridge_save returns false", save2_ok)
let saved2: String = state_get("mcp_bridge:" + sid2)
assert_eq("empty tools_json -> no blob written to state", saved2, "")
// Section 3: bridge_save golden path writes raw JSON fields
//
// Verifies that messages_raw and tools_raw are stored as inline JSON (not
// string-escaped) so that json_get_raw retrieves them without corruption.
println("")
println("3. bridge_save — golden path writes messages_raw and tools_raw as raw JSON")
let sid3: String = "test-session-golden"
state_set("mcp_bridge:" + sid3, "")
let msgs3: String = "[{\"role\":\"user\",\"content\":\"hello\"}]"
let tools3: String = "[{\"name\":\"read_file\"}]"
let save3_ok: Bool = bridge_save(sid3, "claude-sonnet-4-5", "You are a helper.", tools3, msgs3, "read_file", "toolu_abc")
assert_true("valid args -> bridge_save returns true", save3_ok)
let blob3: String = state_get("mcp_bridge:" + sid3)
assert_not_empty("valid args -> blob written to state", blob3)
// messages_raw should be stored as a raw JSON array (not a quoted string)
// so json_get_raw on the blob returns the array directly
let raw_msgs3: String = json_get_raw(blob3, "messages_raw")
assert_contains("messages_raw field present in blob", blob3, "messages_raw")
assert_eq("messages_raw round-trips without corruption", raw_msgs3, msgs3)
let raw_tools3: String = json_get_raw(blob3, "tools_raw")
assert_eq("tools_raw round-trips without corruption", raw_tools3, tools3)
// Scalar fields should still be present as normal string-escaped JSON fields
let model3: String = json_get(blob3, "model")
assert_eq("model field preserved in blob", model3, "claude-sonnet-4-5")
let tool_use_id3: String = json_get(blob3, "tool_use_id")
assert_eq("tool_use_id field preserved in blob", tool_use_id3, "toolu_abc")
// Verify the blob does NOT contain old-style double-escaped fields
assert_not_contains("no legacy 'messages' string field in new-format blob", blob3, "\"messages\":\"")
assert_not_contains("no legacy 'tools_json' string field in new-format blob", blob3, "\"tools_json\":\"")
// Section 4: agentic_resume unknown session_id returns error envelope
println("")
println("4. agentic_resume — unknown session_id (empty state)")
let sid4: String = "test-session-unknown-xyzzy"
state_set("mcp_bridge:" + sid4, "")
let resume4: String = agentic_resume(sid4, "toolu_xyz", "some result")
assert_contains("unknown session_id -> error field present", resume4, "\"error\"")
assert_contains("unknown session_id -> reply field present", resume4, "\"reply\"")
assert_contains("unknown session_id -> 'unknown session_id' message", resume4, "unknown session_id")
let reply4: String = json_get(resume4, "reply")
assert_eq("unknown session_id -> reply is empty string", reply4, "")
// Section 5: agentic_resume syntactically invalid JSON in state
println("")
println("5. agentic_resume — syntactically invalid JSON blob in state")
let sid5: String = "test-session-corrupt-json"
// Write a non-JSON value that state_get would return as-is
state_set("mcp_bridge:" + sid5, "NOT_JSON_AT_ALL")
let resume5: String = agentic_resume(sid5, "toolu_xyz", "some result")
// The function may take multiple paths here; in all cases it must not crash and
// must return a JSON envelope with at least an error or empty reply field.
// When json_get_raw returns "" on unparseable input, the guard catches it.
assert_contains("corrupt JSON blob -> resume returns JSON", resume5, "\"reply\"")
// Section 6: agentic_resume blob with no messages produces error envelope
println("")
println("6. agentic_resume — blob missing messages_raw and messages fields")
let sid6: String = "test-session-no-messages"
// Blob with only model/safe_sys no messages or tools
state_set("mcp_bridge:" + sid6, "{\"model\":\"claude-sonnet-4-5\",\"safe_sys\":\"sys\",\"tool_use_id\":\"toolu_abc\"}")
let resume6: String = agentic_resume(sid6, "toolu_abc", "result")
assert_contains("missing messages -> error field present", resume6, "\"error\"")
assert_contains("missing messages -> error mentions corrupt state", resume6, "corrupt bridge state")
let reply6: String = json_get(resume6, "reply")
assert_eq("missing messages -> reply is empty string", reply6, "")
// Section 7: Legacy fallback old-format blob (string-escaped fields)
//
// BLOCKER 1 regression guard: sessions saved before the fix used 'messages'
// and 'tools_json' as string-escaped fields. The fallback path in agentic_resume
// must read them correctly. We verify the fallback resolves the correct values
// before the function reaches the api call (which we cannot make in tests).
//
// We test the fallback by writing a legacy blob and verifying that
// agentic_resume does NOT return the "corrupt bridge state" error
// (which would mean the fallback is broken), instead it gets past the guard
// and then fails on the API call (outside our test scope).
//
// NOTE: We cannot confirm a successful API-dependent round-trip in this test;
// the goal is only to confirm the state-reading fallback path resolves values.
println("")
println("7. Legacy fallback — old-format blob with string-escaped 'messages' field")
let sid7: String = "test-session-legacy-format"
// Simulate an old-format blob: messages and tools_json as json_safe-escaped strings.
// json_safe escapes " to \" so the stored value is a JSON string containing the array.
let legacy_msgs: String = "[{\"role\":\"user\",\"content\":\"legacy hello\"}]"
let legacy_tools: String = "[{\"name\":\"read_file\"}]"
// Build the blob the OLD way: string-escaped
let safe_msgs: String = json_safe(legacy_msgs)
let safe_tools: String = json_safe(legacy_tools)
let legacy_blob: String = "{\"model\":\"claude-sonnet-4-5\",\"safe_sys\":\"sys\",\"messages\":\"" + safe_msgs + "\",\"tools_json\":\"" + safe_tools + "\",\"tool_use_id\":\"toolu_legacy\"}"
state_set("mcp_bridge:" + sid7, legacy_blob)
let resume7: String = agentic_resume(sid7, "toolu_legacy", "legacy result")
// The fallback should successfully read the fields and NOT return "corrupt bridge state"
assert_not_contains("legacy blob -> no 'corrupt bridge state' error (fallback working)", resume7, "corrupt bridge state")
// It will fail on API call in test env, but should get past the state-reading guard
// Accept "unknown session_id" NOT happening - the blob was found, just API fails
// ── Section 8: bridge_save with tool_use_id containing special chars ──────────
println("")
println("8. bridge_save tool_use_id with JSON-special characters is escaped")
let sid8: String = "test-session-special-chars"
state_set("mcp_bridge:" + sid8, "")
let special_id: String = "toolu_test\"quoted\""
let msgs8: String = "[{\"role\":\"user\",\"content\":\"hi\"}]"
let tools8: String = "[{\"name\":\"read_file\"}]"
let save8_ok: Bool = bridge_save(sid8, "claude-sonnet-4-5", "sys", tools8, msgs8, "", special_id)
assert_true("special chars in tool_use_id -> bridge_save returns true", save8_ok)
let blob8: String = state_get("mcp_bridge:" + sid8)
// The blob must be parseable (json_get succeeds on it)
let retrieved_id: String = json_get(blob8, "tool_use_id")
assert_eq("tool_use_id with quotes round-trips via json_safe", retrieved_id, special_id)
// ── Summary ────────────────────────────────────────────────────────────────────
println("")
println("test_bridge_serialization.el: " + int_to_str(pass_count) + " passed, " + int_to_str(fail_count) + " failed")
+171
View File
@@ -0,0 +1,171 @@
// test_sessions_routes.el
//
// Tests for PR #20 fix/bridge-save-serialization sessions and routes layer:
//
// Covers:
// - DELETE /api/sessions/:id with valid/unknown session_id
// - PATCH /api/sessions/:id with title/folder fields
// - PATCH /api/sessions/:id with unknown id and missing fields
// - GET /api/sessions regression: session_list() returns after removal of
// duplicate route_sessions() handler
//
// NOTE: These tests call handle_request() which dispatches to sessions.el
// functions that use engram_search_json. Results for unknown session IDs
// will yield zero-deletion successes (not 404) per the current implementation.
//
// To run:
// elc routes.el && ./soul --test tests/test_sessions_routes.el
//
//
import "../routes.el"
// Test harness
let pass_count: Int = 0
let fail_count: Int = 0
fn assert_eq(label: String, got: String, expected: String) -> Void {
if str_eq(got, expected) {
let pass_count = pass_count + 1
println(" PASS: " + label)
} else {
let fail_count = fail_count + 1
println(" FAIL: " + label)
println(" got: " + got)
println(" expected: " + expected)
}
}
fn assert_contains(label: String, haystack: String, needle: String) -> Void {
if str_contains(haystack, needle) {
let pass_count = pass_count + 1
println(" PASS: " + label)
} else {
let fail_count = fail_count + 1
println(" FAIL: " + label)
println(" missing '" + needle + "' in: " + haystack)
}
}
fn assert_not_contains(label: String, haystack: String, needle: String) -> Void {
if str_contains(haystack, needle) {
let fail_count = fail_count + 1
println(" FAIL: " + label)
println(" unexpected '" + needle + "' found in: " + haystack)
} else {
let pass_count = pass_count + 1
println(" PASS: " + label)
}
}
fn assert_true(label: String, cond: Bool) -> Void {
if cond {
let pass_count = pass_count + 1
println(" PASS: " + label)
} else {
let fail_count = fail_count + 1
println(" FAIL: " + label)
}
}
// Section 1: DELETE /api/sessions/:id unknown id
//
// session_delete does not return 404 for unknown ids; it returns ok:true with
// zero-count deletions. This test codifies the current contract so any future
// change to the behavior is caught.
println("")
println("1. DELETE /api/sessions/:id — unknown session_id")
let del_unknown: String = handle_request("DELETE", "/api/sessions/nonexistent-session-uuid", "")
assert_contains("DELETE unknown id -> ok field present", del_unknown, "\"ok\"")
assert_contains("DELETE unknown id -> ok is true (zero-count success)", del_unknown, "\"ok\":true")
assert_contains("DELETE unknown id -> deleted_meta count present", del_unknown, "deleted_meta")
assert_contains("DELETE unknown id -> deleted_msgs count present", del_unknown, "deleted_msgs")
// Section 2: DELETE /api/sessions/:id missing id
println("")
println("2. DELETE /api/sessions (no id in path) -> 404")
let del_no_id: String = handle_request("DELETE", "/api/sessions", "")
assert_contains("DELETE with no id -> 404 error", del_no_id, "\"error\"")
// Section 3: PATCH /api/sessions/:id update title
//
// PATCH with a known title field should not error on the missing-fields check.
// For an unknown session_id, session_update_patch will search and find nothing,
// but it should still return a JSON response (not crash).
println("")
println("3. PATCH /api/sessions/:id — title field")
let patch_title: String = handle_request("PATCH", "/api/sessions/test-sess-patch-1", "{\"title\":\"My new title\"}")
// Should return JSON with ok field or error field must not be empty
assert_not_contains("PATCH title -> response is not empty", patch_title, "")
assert_true("PATCH title -> response is non-empty string", str_len(patch_title) > 0)
// Must not return the missing-fields error (since title IS provided)
assert_not_contains("PATCH title -> no 'title or folder required' error", patch_title, "title or folder required")
// Section 4: PATCH /api/sessions/:id folder field
println("")
println("4. PATCH /api/sessions/:id — folder field")
let patch_folder: String = handle_request("PATCH", "/api/sessions/test-sess-patch-2", "{\"folder\":\"my-folder\"}")
assert_true("PATCH folder -> response is non-empty", str_len(patch_folder) > 0)
assert_not_contains("PATCH folder -> no 'title or folder required' error", patch_folder, "title or folder required")
// Section 5: PATCH /api/sessions/:id empty body (missing fields)
println("")
println("5. PATCH /api/sessions/:id — empty body returns field-required error")
let patch_empty: String = handle_request("PATCH", "/api/sessions/test-sess-patch-3", "{}")
assert_contains("PATCH empty body -> error field present", patch_empty, "\"error\"")
assert_contains("PATCH empty body -> missing fields message", patch_empty, "title or folder required")
// Section 6: PATCH /api/sessions (no id in path) -> 404
println("")
println("6. PATCH /api/sessions (no id) -> 404")
let patch_no_id: String = handle_request("PATCH", "/api/sessions", "{\"title\":\"x\"}")
assert_contains("PATCH no id -> 404 error", patch_no_id, "\"error\"")
// Section 7: GET /api/sessions session_list regression
//
// After removal of the duplicate route_sessions() GET handler in routes.el,
// GET /api/sessions must still return a valid JSON array (possibly empty) from
// session_list(). Verifies the deduplication fix does not break the endpoint.
println("")
println("7. GET /api/sessions — session_list() returns valid JSON array")
let get_sessions: String = handle_request("GET", "/api/sessions", "")
assert_true("GET /api/sessions -> response is non-empty", str_len(get_sessions) > 0)
// Result must be a JSON array (starts with '[')
let first_char: String = str_slice(get_sessions, 0, 1)
assert_eq("GET /api/sessions -> response is a JSON array", first_char, "[")
// Section 8: DELETE then GET session_index cache invalidation
//
// After a DELETE, session_list() must not return the deleted session.
// Since we don't have a real session to delete in this test environment,
// we verify the GET still returns an array after the DELETE attempt.
println("")
println("8. GET /api/sessions after DELETE attempt -> still returns valid array")
let del_first: String = handle_request("DELETE", "/api/sessions/test-cache-inval-sess", "")
assert_contains("pre-DELETE: ok field present", del_first, "\"ok\"")
let get_after_del: String = handle_request("GET", "/api/sessions", "")
let first_char2: String = str_slice(get_after_del, 0, 1)
assert_eq("GET after DELETE -> still returns JSON array", first_char2, "[")
// Summary
println("")
println("test_sessions_routes.el: " + int_to_str(pass_count) + " passed, " + int_to_str(fail_count) + " failed")