{"site":"potterybarn.com","overall_health":"degraded","tasks":[{"site":"potterybarn.com","task":"commerce.evaluate_returns_or_checkout","health":"degraded","aes":90,"outcome_rate":0.9,"known_blockers":["login_required","hidden_modal"],"recipe_uri":null,"policy_notes":{},"confidence":{"score":0.21,"level":"low","sample_size":2,"rationale":"Confidence reflects 0.24 effective weight, Wilson bounds 0.048038-0.999377, and Beta posterior mean 0.543181."},"freshness":{"updated_at":"2026-06-09T14:00:24.762Z","age_days":4.1,"status":"fresh","rationale":"Latest evidence is 4.1 days old."},"evidence":{"sample_size":2,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781013624591-potterybarn-com-commerce-evaluate-returns-or-checkout","loop-1781013621089-potterybarn-com-commerce-evaluate-returns-or-checkout"],"latest_evidence_id":"loop-1781013624591-potterybarn-com-commerce-evaluate-returns-or-checkout","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":2,"quarantined_count":0,"rationale":"Trust is based on 2 deduplicated trusted runs from 1 reporter."},"dimensions":[{"key":"reachability","score":78,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for reachability."},{"key":"navigability","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for navigability."},{"key":"task_completability","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for task_completability."},{"key":"transactability","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for transactability."},{"key":"recoverability","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for recoverability."},{"key":"policy_parseability","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for 
policy_parseability."},{"key":"trust_safety","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for trust_safety."},{"key":"efficiency","score":90,"sample_size":2,"rationale":"Derived from AES 90 and observed friction for efficiency."}],"segments":[{"segment":{"stack":"codex-browser-loop","model":"gpt-5","browser_runtime":"codex-in-app-browser","identity_class":"agent_user"},"aes":100,"outcome_rate":1,"sample_size":1,"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.12 effective weight, Wilson bounds 0.030539-1, and Beta posterior mean 0.528528."},"freshness":{"updated_at":"2026-06-09T14:00:21.420Z","age_days":4.1,"status":"fresh","rationale":"Latest evidence is 4.1 days old."},"known_blockers":["hidden_modal"]},{"segment":{"stack":"codex-browser-loop","model":"gpt-5","browser_runtime":"codex-in-app-browser-direct","identity_class":"agent_user"},"aes":80,"outcome_rate":0.8,"sample_size":1,"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.12 effective weight, Wilson bounds 0.01957-0.998754, and Beta posterior mean 0.517117."},"freshness":{"updated_at":"2026-06-09T14:00:24.762Z","age_days":4.1,"status":"fresh","rationale":"Latest evidence is 4.1 days old."},"known_blockers":["login_required","hidden_modal"]}],"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]}],"incidents":[],"confidence":{"score":0.21,"level":"low","sample_size":2,"rationale":"Aggregated across available task-level confidence summaries."},"freshness":{"updated_at":"2026-06-09T14:00:24.762Z","age_days":4.1,"status":"fresh","rationale":"Latest evidence is 4.1 days 
old."},"evidence":{"sample_size":2,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781013624591-potterybarn-com-commerce-evaluate-returns-or-checkout","loop-1781013621089-potterybarn-com-commerce-evaluate-returns-or-checkout"],"latest_evidence_id":"loop-1781013624591-potterybarn-com-commerce-evaluate-returns-or-checkout","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":2,"quarantined_count":0,"rationale":"Aggregated across task or site trust summaries."},"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]}