{"site":"aa.com","overall_health":"blocked","tasks":[{"site":"aa.com","task":"travel.cancel_flight","health":"degraded","aes":75,"outcome_rate":0.75,"known_blockers":["confirmation_email_missing"],"recipe_uri":"recipe://travel.cancel_flight/aa-reservations-faq-cancel/v1","policy_notes":{"observation_method":"public_official_help_or_docs_page","observation_date":"2026-06-17","cancellation_path":"find_your_trip_or_aadvantage_cancel_trip","refund_branching":"fare_type_and_24_hour_rule_dependent","confirmation":"cancellation_information_sent_by_email","source_urls":"https://www.aa.com/pubcontent/en_US/customer-service/faqs/reservations-tickets-faqs.jsp | https://www.aa.com/refunds/"},"confidence":{"score":0.28,"level":"low","sample_size":2,"rationale":"Confidence reflects 0.7 effective weight, Wilson bounds 0.087624-0.989442, and Beta posterior mean 0.564815."},"freshness":{"updated_at":"2026-06-17T02:28:12.679Z","age_days":0,"status":"fresh","rationale":"Latest evidence is 0 days old."},"evidence":{"sample_size":2,"source_tiers":["public_web_observation"],"evidence_ids":["public-aa-reservations-faq-cancel","public-aa-refunds"],"latest_evidence_id":"public-aa-refunds","notes":["American Airlines documents trip cancellation from Find your trip or AAdvantage account, with email confirmation and refund rules dependent on fare and timing.","Source: https://www.aa.com/pubcontent/en_US/customer-service/faqs/reservations-tickets-faqs.jsp","Source: https://www.aa.com/refunds/"]},"trust":{"score":0.32,"level":"low","reporter_count":0,"deduplicated_evidence_count":0,"quarantined_count":0,"rationale":"Low-trust public web observation from official or public task documentation; treat as directional until measured agent runs arrive."},"dimensions":[{"key":"reachability","score":75,"sample_size":2,"rationale":"Derived from AES 75 and observed friction for reachability."},{"key":"navigability","score":75,"sample_size":2,"rationale":"Derived from AES 75 and observed friction for navigability."},{"key":"task_completability","score":75,"sample_size":2,"rationale":"Derived from AES 75 and observed friction for task_completability."},{"key":"transactability","score":75,"sample_size":2,"rationale":"Derived from AES 75 and observed friction for transactability."},{"key":"recoverability","score":75,"sample_size":2,"rationale":"Derived from AES 75 and observed friction for recoverability."},{"key":"policy_parseability","score":75,"sample_size":2,"rationale":"Derived from AES 75 and observed friction for policy_parseability."},{"key":"trust_safety","score":75,"sample_size":2,"rationale":"Derived from AES 75 and observed friction for trust_safety."},{"key":"efficiency","score":75,"sample_size":2,"rationale":"Derived from AES 75 and observed friction for efficiency."}],"segments":[],"recommended_actions":[{"priority":"high","actor":"agent","action":"Pause before American Airlines final cancellation confirmation.","expected_impact":"Prevents irreversible travel changes when fare refund rules are still ambiguous."}]},{"site":"aa.com","task":"travel.find_refund_policy","health":"constrained","aes":40,"outcome_rate":0.4,"known_blockers":["dynamic_dom_unstable"],"recipe_uri":null,"policy_notes":{},"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.11 effective weight, Wilson bounds 0.00459-0.989732, and Beta posterior mean 0.494686."},"freshness":{"updated_at":"2026-06-09T18:18:05.193Z","age_days":7.3,"status":"aging","rationale":"Latest evidence is 7.3 days old."},"evidence":{"sample_size":1,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781029085013-aa-com-travel-find-refund-policy"],"latest_evidence_id":"loop-1781029085013-aa-com-travel-find-refund-policy","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":1,"quarantined_count":0,"rationale":"Trust is based on 1 deduplicated trusted run from 1 reporter."},"dimensions":[{"key":"reachability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for reachability."},{"key":"navigability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for navigability."},{"key":"task_completability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for task_completability."},{"key":"transactability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for transactability."},{"key":"recoverability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for recoverability."},{"key":"policy_parseability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for policy_parseability."},{"key":"trust_safety","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for trust_safety."},{"key":"efficiency","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for efficiency."}],"segments":[{"segment":{"stack":"codex-browser-loop","model":"gpt-5","browser_runtime":"codex-in-app-browser","identity_class":"agent_user"},"aes":40,"outcome_rate":0.4,"sample_size":1,"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.11 effective weight, Wilson bounds 0.00459-0.989732, and Beta posterior mean 0.494686."},"freshness":{"updated_at":"2026-06-09T18:18:05.193Z","age_days":7.3,"status":"aging","rationale":"Latest evidence is 7.3 days old."},"known_blockers":["dynamic_dom_unstable"]}],"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]},{"site":"aa.com","task":"travel.find_baggage_policy","health":"healthy","aes":100,"outcome_rate":1,"known_blockers":[],"recipe_uri":null,"policy_notes":{},"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.11 effective weight, Wilson bounds 0.028361-1, and Beta posterior mean 0.526545."},"freshness":{"updated_at":"2026-06-09T17:11:17.358Z","age_days":7.4,"status":"aging","rationale":"Latest evidence is 7.4 days old."},"evidence":{"sample_size":1,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781025077177-aa-com-travel-find-baggage-policy"],"latest_evidence_id":"loop-1781025077177-aa-com-travel-find-baggage-policy","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":1,"quarantined_count":0,"rationale":"Trust is based on 1 deduplicated trusted run from 1 reporter."},"dimensions":[{"key":"reachability","score":100,"sample_size":1,"rationale":"Derived from AES 100 and observed friction for reachability."},{"key":"navigability","score":100,"sample_size":1,"rationale":"Derived from AES 100 and observed friction for navigability."},{"key":"task_completability","score":100,"sample_size":1,"rationale":"Derived from AES 100 and observed friction for task_completability."},{"key":"transactability","score":100,"sample_size":1,"rationale":"Derived from AES 100 and observed friction for transactability."},{"key":"recoverability","score":100,"sample_size":1,"rationale":"Derived from AES 100 and observed friction for recoverability."},{"key":"policy_parseability","score":100,"sample_size":1,"rationale":"Derived from AES 100 and observed friction for policy_parseability."},{"key":"trust_safety","score":100,"sample_size":1,"rationale":"Derived from AES 100 and observed friction for trust_safety."},{"key":"efficiency","score":100,"sample_size":1,"rationale":"Derived from AES 100 and observed friction for efficiency."}],"segments":[{"segment":{"stack":"codex-browser-loop","model":"gpt-5","browser_runtime":"codex-in-app-browser","identity_class":"agent_user"},"aes":100,"outcome_rate":1,"sample_size":1,"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.11 effective weight, Wilson bounds 0.028361-1, and Beta posterior mean 0.526545."},"freshness":{"updated_at":"2026-06-09T17:11:17.358Z","age_days":7.4,"status":"aging","rationale":"Latest evidence is 7.4 days old."},"known_blockers":[]}],"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]},{"site":"aa.com","task":"future_agent_tasks.monitor_prices","health":"constrained","aes":40,"outcome_rate":0.4,"known_blockers":["dynamic_dom_unstable"],"recipe_uri":null,"policy_notes":{},"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.11 effective weight, Wilson bounds 0.004566-0.989786, and Beta posterior mean 0.494712."},"freshness":{"updated_at":"2026-06-09T12:46:12.378Z","age_days":7.6,"status":"aging","rationale":"Latest evidence is 7.6 days old."},"evidence":{"sample_size":1,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781009172313-aa-com-future-agent-tasks-monitor-prices"],"latest_evidence_id":"loop-1781009172313-aa-com-future-agent-tasks-monitor-prices","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":1,"quarantined_count":0,"rationale":"Trust is based on 1 deduplicated trusted run from 1 reporter."},"dimensions":[{"key":"reachability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for reachability."},{"key":"navigability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for navigability."},{"key":"task_completability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for task_completability."},{"key":"transactability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for transactability."},{"key":"recoverability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for recoverability."},{"key":"policy_parseability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for policy_parseability."},{"key":"trust_safety","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for trust_safety."},{"key":"efficiency","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for efficiency."}],"segments":[{"segment":{"stack":"codex-browser-loop","model":"gpt-5","browser_runtime":"codex-in-app-browser","identity_class":"agent_user"},"aes":40,"outcome_rate":0.4,"sample_size":1,"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.11 effective weight, Wilson bounds 0.004566-0.989785, and Beta posterior mean 0.494712."},"freshness":{"updated_at":"2026-06-09T12:46:12.378Z","age_days":7.6,"status":"aging","rationale":"Latest evidence is 7.6 days old."},"known_blockers":["dynamic_dom_unstable"]}],"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]},{"site":"aa.com","task":"customer_support.flight_help","health":"blocked","aes":20,"outcome_rate":0.2,"known_blockers":["dynamic_dom_unstable","navigation_failed"],"recipe_uri":null,"policy_notes":{},"confidence":{"score":0.18,"level":"low","sample_size":2,"rationale":"Confidence reflects 0.22 effective weight, Wilson bounds 0.002276-0.964789, and Beta posterior mean 0.469891."},"freshness":{"updated_at":"2026-06-09T11:53:03.474Z","age_days":7.6,"status":"aging","rationale":"Latest evidence is 7.6 days old."},"evidence":{"sample_size":2,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781005983239-aa-com-customer-support-flight-help","loop-1781005868056-aa-com-customer-support-flight-help"],"latest_evidence_id":"loop-1781005983239-aa-com-customer-support-flight-help","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":2,"quarantined_count":0,"rationale":"Trust is based on 2 deduplicated trusted runs from 1 reporter."},"dimensions":[{"key":"reachability","score":20,"sample_size":2,"rationale":"Derived from AES 20 and observed friction for reachability."},{"key":"navigability","score":20,"sample_size":2,"rationale":"Derived from AES 20 and observed friction for navigability."},{"key":"task_completability","score":20,"sample_size":2,"rationale":"Derived from AES 20 and observed friction for task_completability."},{"key":"transactability","score":20,"sample_size":2,"rationale":"Derived from AES 20 and observed friction for transactability."},{"key":"recoverability","score":20,"sample_size":2,"rationale":"Derived from AES 20 and observed friction for recoverability."},{"key":"policy_parseability","score":20,"sample_size":2,"rationale":"Derived from AES 20 and observed friction for policy_parseability."},{"key":"trust_safety","score":20,"sample_size":2,"rationale":"Derived from AES 20 and observed friction for trust_safety."},{"key":"efficiency","score":20,"sample_size":2,"rationale":"Derived from AES 20 and observed friction for efficiency."}],"segments":[{"segment":{"stack":"codex-browser-loop","model":"gpt-5","browser_runtime":"codex-in-app-browser","identity_class":"agent_user"},"aes":20,"outcome_rate":0.2,"sample_size":2,"confidence":{"score":0.18,"level":"low","sample_size":2,"rationale":"Confidence reflects 0.22 effective weight, Wilson bounds 0.002276-0.96479, and Beta posterior mean 0.469891."},"freshness":{"updated_at":"2026-06-09T11:53:03.474Z","age_days":7.6,"status":"aging","rationale":"Latest evidence is 7.6 days old."},"known_blockers":["dynamic_dom_unstable","navigation_failed"]}],"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]},{"site":"aa.com","task":"travel.manage_flight_reservation","health":"constrained","aes":40,"outcome_rate":0.4,"known_blockers":["dynamic_dom_unstable"],"recipe_uri":null,"policy_notes":{},"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.11 effective weight, Wilson bounds 0.00456-0.989798, and Beta posterior mean 0.494718."},"freshness":{"updated_at":"2026-06-09T11:31:28.121Z","age_days":7.6,"status":"aging","rationale":"Latest evidence is 7.6 days old."},"evidence":{"sample_size":1,"source_tiers":["public_web_observation"],"evidence_ids":["loop-1781004688022-aa-com-travel-manage-flight-reservation"],"latest_evidence_id":"loop-1781004688022-aa-com-travel-manage-flight-reservation","notes":["Status is derived from reported runs stored in this server process."]},"trust":{"score":0.38,"level":"low","reporter_count":1,"deduplicated_evidence_count":1,"quarantined_count":0,"rationale":"Trust is based on 1 deduplicated trusted run from 1 reporter."},"dimensions":[{"key":"reachability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for reachability."},{"key":"navigability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for navigability."},{"key":"task_completability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for task_completability."},{"key":"transactability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for transactability."},{"key":"recoverability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for recoverability."},{"key":"policy_parseability","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for policy_parseability."},{"key":"trust_safety","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for trust_safety."},{"key":"efficiency","score":40,"sample_size":1,"rationale":"Derived from AES 40 and observed friction for efficiency."}],"segments":[{"segment":{"stack":"codex-browser-loop","model":"gpt-5","browser_runtime":"codex-in-app-browser","identity_class":"agent_user"},"aes":40,"outcome_rate":0.4,"sample_size":1,"confidence":{"score":0.23,"level":"low","sample_size":1,"rationale":"Confidence reflects 0.11 effective weight, Wilson bounds 0.00456-0.989797, and Beta posterior mean 0.494718."},"freshness":{"updated_at":"2026-06-09T11:31:28.121Z","age_days":7.6,"status":"aging","rationale":"Latest evidence is 7.6 days old."},"known_blockers":["dynamic_dom_unstable"]}],"recommended_actions":[{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]}],"incidents":[{"id":"incident_aa_com_customer_support_flight_help","task":"customer_support.flight_help","severity":"high","opened_at":"2026-06-09T11:53:03.474Z","status":"open","summary":"Blocking friction observed for customer_support.flight_help: dynamic_dom_unstable, navigation_failed"}],"confidence":{"score":0.23,"level":"low","sample_size":8,"rationale":"Aggregated across available task-level confidence summaries."},"freshness":{"updated_at":"2026-06-17T02:28:12.679Z","age_days":0,"status":"fresh","rationale":"Latest evidence is 0 days old."},"evidence":{"sample_size":8,"source_tiers":["public_web_observation"],"evidence_ids":["public-aa-reservations-faq-cancel","public-aa-refunds","loop-1781029085013-aa-com-travel-find-refund-policy","loop-1781025077177-aa-com-travel-find-baggage-policy","loop-1781009172313-aa-com-future-agent-tasks-monitor-prices","loop-1781005983239-aa-com-customer-support-flight-help","loop-1781005868056-aa-com-customer-support-flight-help","loop-1781004688022-aa-com-travel-manage-flight-reservation"],"latest_evidence_id":"loop-1781004688022-aa-com-travel-manage-flight-reservation","notes":["American Airlines documents trip cancellation from Find your trip or AAdvantage account, with email confirmation and refund rules dependent on fare and timing.","Source: https://www.aa.com/pubcontent/en_US/customer-service/faqs/reservations-tickets-faqs.jsp","Source: https://www.aa.com/refunds/","Status is derived from reported runs stored in this server process."]},"trust":{"score":0.37,"level":"low","reporter_count":5,"deduplicated_evidence_count":6,"quarantined_count":0,"rationale":"Aggregated across task or site trust summaries."},"recommended_actions":[{"priority":"high","actor":"agent","action":"Pause before American Airlines final cancellation confirmation.","expected_impact":"Prevents irreversible travel changes when fare refund rules are still ambiguous."},{"priority":"medium","actor":"agent","action":"Use preflight output as the execution guardrail and report the final outcome.","expected_impact":"Improves future confidence and catches drift."}]}