{"site":"avianca.com","overall_health":"constrained","tasks":[{"site":"avianca.com","task":"travel.manage_flight_reservation","health":"constrained","aes":40,"outcome_rate":0.4,"known_blockers":["hidden_modal","navigation_failed"],"recipe_uri":null,"policy_notes":{},"confidence":{"score":0.12,"level":"low","sample_size":2,"rationale":"Confidence reflects 0.24 effective weight, Wilson bounds 0.009703-0.978471, and Beta posterior mean 0.48923."},"freshness":{"updated_at":"2026-06-09T14:33:34.669Z","age_days":4.1,"status":"fresh","rationale":"Latest evidence is 4.1 days old."},"evidence":{"sample_size":2,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781015614524-avianca-com-travel-manage-flight-reservation","loop-1781011284141-avianca-com-travel-manage-flight-reservation"],"latest_evidence_id":"loop-1781015614524-avianca-com-travel-manage-flight-reservation","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":2,"quarantined_count":0,"rationale":"Trust is based on 2 deduplicated trusted runs from 1 reporter."},"dimensions":[{"key":"reachability","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for reachability."},{"key":"navigability","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for navigability."},{"key":"task_completability","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for task_completability."},{"key":"transactability","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for transactability."},{"key":"recoverability","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for recoverability."},{"key":"policy_parseability","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for 
policy_parseability."},{"key":"trust_safety","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for trust_safety."},{"key":"efficiency","score":40,"sample_size":2,"rationale":"Derived from AES 40 and observed friction for efficiency."}],"segments":[{"segment":{"stack":"codex-browser-loop","model":"gpt-5","browser_runtime":"fallback-playwright-repair-after-iab-unavailable","identity_class":"agent_user"},"aes":80,"outcome_rate":0.8,"sample_size":1,"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.12 effective weight, Wilson bounds 0.01958-0.998753, and Beta posterior mean 0.517126."},"freshness":{"updated_at":"2026-06-09T14:33:34.669Z","age_days":4.1,"status":"fresh","rationale":"Latest evidence is 4.1 days old."},"known_blockers":["hidden_modal"]},{"segment":{"stack":"codex-browser-loop","model":"gpt-5","browser_runtime":"fallback-playwright-after-iab-failure","identity_class":"agent_user"},"aes":0,"outcome_rate":0,"sample_size":1,"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.12 effective weight, Wilson bounds 0-0.969478, and Beta posterior mean 0.471488."},"freshness":{"updated_at":"2026-06-09T13:21:24.316Z","age_days":4.1,"status":"fresh","rationale":"Latest evidence is 4.1 days old."},"known_blockers":["navigation_failed"]}],"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]}],"incidents":[],"confidence":{"score":0.12,"level":"low","sample_size":2,"rationale":"Aggregated across available task-level confidence summaries."},"freshness":{"updated_at":"2026-06-09T14:33:34.669Z","age_days":4.1,"status":"fresh","rationale":"Latest evidence is 4.1 days 
old."},"evidence":{"sample_size":2,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781015614524-avianca-com-travel-manage-flight-reservation","loop-1781011284141-avianca-com-travel-manage-flight-reservation"],"latest_evidence_id":"loop-1781015614524-avianca-com-travel-manage-flight-reservation","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":2,"quarantined_count":0,"rationale":"Aggregated across task or site trust summaries."},"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]}