{"site":"mass.gov","overall_health":"healthy","tasks":[{"site":"mass.gov","task":"gov_civic.book_dmv_appointment","health":"healthy","aes":90,"outcome_rate":0.9,"known_blockers":[],"recipe_uri":null,"policy_notes":{},"confidence":{"score":0.21,"level":"low","sample_size":2,"rationale":"Confidence reflects 0.24 effective weight, Wilson bounds 0.048022-0.999378, and Beta posterior mean 0.543167."},"freshness":{"updated_at":"2026-06-09T13:40:31.021Z","age_days":4.1,"status":"fresh","rationale":"Latest evidence is 4.1 days old."},"evidence":{"sample_size":2,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781012430905-mass-gov-gov-civic-book-dmv-appointment","loop-1781012219011-mass-gov-gov-civic-book-dmv-appointment"],"latest_evidence_id":"loop-1781012430905-mass-gov-gov-civic-book-dmv-appointment","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":2,"quarantined_count":1,"rationale":"Trust is based on 2 deduplicated trusted runs from 1 reporter."},"dimensions":[{"key":"reachability","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for reachability."},{"key":"navigability","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for navigability."},{"key":"task_completability","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for task_completability."},{"key":"transactability","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for transactability."},{"key":"recoverability","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for recoverability."},{"key":"policy_parseability","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for policy_parseability."},{"key":"trust_safety","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for trust_safety."},{"key":"efficiency","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for efficiency."}],"segments":[{"segment":{"stack":"codex-http-loop","model":"gpt-5","browser_runtime":"http-fetch-after-browser-unavailable","identity_class":"agent_user"},"aes":100,"outcome_rate":1,"sample_size":1,"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.12 effective weight, Wilson bounds 0.030528-1, and Beta posterior mean 0.528518."},"freshness":{"updated_at":"2026-06-09T13:36:59.209Z","age_days":4.1,"status":"fresh","rationale":"Latest evidence is 4.1 days old."},"known_blockers":[]},{"segment":{"stack":"codex-browser-loop","model":"gpt-5","browser_runtime":"codex-in-app-browser-direct","identity_class":"agent_user"},"aes":80,"outcome_rate":0.8,"sample_size":1,"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.12 effective weight, Wilson bounds 0.019564-0.998754, and Beta posterior mean 0.517112."},"freshness":{"updated_at":"2026-06-09T13:40:31.021Z","age_days":4.1,"status":"fresh","rationale":"Latest evidence is 4.1 days old."},"known_blockers":[]}],"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]}],"incidents":[],"confidence":{"score":0.21,"level":"low","sample_size":2,"rationale":"Aggregated across available task-level confidence summaries."},"freshness":{"updated_at":"2026-06-09T13:40:31.021Z","age_days":4.1,"status":"fresh","rationale":"Latest evidence is 4.1 days old."},"evidence":{"sample_size":2,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781012430905-mass-gov-gov-civic-book-dmv-appointment","loop-1781012219011-mass-gov-gov-civic-book-dmv-appointment"],"latest_evidence_id":"loop-1781012219011-mass-gov-gov-civic-book-dmv-appointment","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":2,"quarantined_count":1,"rationale":"Aggregated across task or site trust summaries."},"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]}