{"site":"northwell.edu","overall_health":"constrained","tasks":[{"site":"northwell.edu","task":"healthcare_admin.book_appointment","health":"constrained","aes":40,"outcome_rate":0.4,"known_blockers":["login_required","navigation_failed"],"recipe_uri":null,"policy_notes":{},"confidence":{"score":0.12,"level":"low","sample_size":2,"rationale":"Confidence reflects 0.24 effective weight, Wilson bounds 0.009701-0.978437, and Beta posterior mean 0.489198."},"freshness":{"updated_at":"2026-06-09T15:01:23.863Z","age_days":4,"status":"fresh","rationale":"Latest evidence is 4 days old."},"evidence":{"sample_size":2,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781017283679-northwell-edu-healthcare-admin-book-appointment","loop-1781016985289-northwell-edu-healthcare-admin-book-appointment"],"latest_evidence_id":"loop-1781017283679-northwell-edu-healthcare-admin-book-appointment","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":2,"quarantined_count":0,"rationale":"Trust is based on 2 deduplicated trusted runs from 1 reporter."},"dimensions":[{"key":"reachability","score":28,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for reachability."},{"key":"navigability","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for navigability."},{"key":"task_completability","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for task_completability."},{"key":"transactability","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for transactability."},{"key":"recoverability","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for recoverability."},{"key":"policy_parseability","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for policy_parseability."},{"key":"trust_safety","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for trust_safety."},{"key":"efficiency","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for efficiency."}],"segments":[{"segment":{"stack":"codex-browser-loop","model":"gpt-5","browser_runtime":"http-repair-current-official-public-url","identity_class":"agent_user"},"aes":80,"outcome_rate":0.8,"sample_size":1,"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.12 effective weight, Wilson bounds 0.019588-0.998753, and Beta posterior mean 0.517132."},"freshness":{"updated_at":"2026-06-09T15:01:23.863Z","age_days":4,"status":"fresh","rationale":"Latest evidence is 4 days old."},"known_blockers":["login_required"]},{"segment":{"stack":"codex-browser-loop","model":"gpt-5","browser_runtime":"codex-in-app-browser","identity_class":"agent_user"},"aes":0,"outcome_rate":0,"sample_size":1,"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.12 effective weight, Wilson bounds 0-0.969434, and Beta posterior mean 0.471448."},"freshness":{"updated_at":"2026-06-09T14:56:25.431Z","age_days":4,"status":"fresh","rationale":"Latest evidence is 4 days old."},"known_blockers":["navigation_failed"]}],"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]}],"incidents":[],"confidence":{"score":0.12,"level":"low","sample_size":2,"rationale":"Aggregated across available task-level confidence summaries."},"freshness":{"updated_at":"2026-06-09T15:01:23.863Z","age_days":4,"status":"fresh","rationale":"Latest evidence is 4 days old."},"evidence":{"sample_size":2,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781017283679-northwell-edu-healthcare-admin-book-appointment","loop-1781016985289-northwell-edu-healthcare-admin-book-appointment"],"latest_evidence_id":"loop-1781016985289-northwell-edu-healthcare-admin-book-appointment","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":2,"quarantined_count":0,"rationale":"Aggregated across task or site trust summaries."},"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]}