{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:ZIYN26PLHZV3WX5WPSDFUTI6R2","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4841ab5d47b0554976d904cb4fee88a62b4bf0cbe9cf4f844c0a546e636f01cf","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-27T16:14:47Z","title_canon_sha256":"03b2356db85ccb2c9dfd6ddbe05f164e7dcf0f1cc3e4e29d0f073cb62f4adb9f"},"schema_version":"1.0","source":{"id":"2605.28683","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.28683","created_at":"2026-05-28T02:04:59Z"},{"alias_kind":"arxiv_version","alias_value":"2605.28683v1","created_at":"2026-05-28T02:04:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.28683","created_at":"2026-05-28T02:04:59Z"},{"alias_kind":"pith_short_12","alias_value":"ZIYN26PLHZV3","created_at":"2026-05-28T02:04:59Z"},{"alias_kind":"pith_short_16","alias_value":"ZIYN26PLHZV3WX5W","created_at":"2026-05-28T02:04:59Z"},{"alias_kind":"pith_short_8","alias_value":"ZIYN26PL","created_at":"2026-05-28T02:04:59Z"}],"graph_snapshots":[{"event_id":"sha256:8bfda959b348c8941faafdf4be2ce450949a635aafc9bfc642f1b858eef7c6ba","target":"graph","created_at":"2026-05-28T02:04:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.28683/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Existing benchmarks have laid the foundation for travel planning agents by establishing API-centric paradigms. However, as the capabilities of Autonomous Agents continue to advance, their evaluation must evolve beyond simple tool execution toward handling the inherent complexities of the open web. Current benchmarks bypass core cognitive hurdles: they fail to account for information noise, ignore multi-source factual contradictions, and overlook the necessity of grounding visual perception into logical planning. We introduce VeriTrip, a verifiable benchmark designed to meet the increasing dema","authors_text":"Hang Zhang, Jian Liang, Jiayi Tian, Mu Xu, Xiao-Yu Zhang, Xin Xiong, Yuting Xu","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-27T16:14:47Z","title":"VeriTrip: A Verifiable Benchmark for Travel Planning Agents over Unstructured Web Corpora"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.28683","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8f9dddec7894c68e5988b342e6e38d3450c0940b71979b9bc6df40ff4577e7f2","target":"record","created_at":"2026-05-28T02:04:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4841ab5d47b0554976d904cb4fee88a62b4bf0cbe9cf4f844c0a546e636f01cf","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-27T16:14:47Z","title_canon_sha256":"03b2356db85ccb2c9dfd6ddbe05f164e7dcf0f1cc3e4e29d0f073cb62f4adb9f"},"schema_version":"1.0","source":{"id":"2605.28683","kind":"arxiv","version":1}},"canonical_sha256":"ca30dd79eb3e6bbb5fb67c865a4d1e8ea698c916ba81a337a715fc8439df3e96","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"ca30dd79eb3e6bbb5fb67c865a4d1e8ea698c916ba81a337a715fc8439df3e96","first_computed_at":"2026-05-28T02:04:59.759095Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-28T02:04:59.759095Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"UijT/ybdJBciuSHuhSbagez0Kh+pSrUcKYFO+urmHIixmyd8IsN+DKZca8JqN+QndzIuv9l+Xy1ueVDt316uDw==","signature_status":"signed_v1","signed_at":"2026-05-28T02:04:59.759512Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.28683","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8f9dddec7894c68e5988b342e6e38d3450c0940b71979b9bc6df40ff4577e7f2","sha256:8bfda959b348c8941faafdf4be2ce450949a635aafc9bfc642f1b858eef7c6ba"],"state_sha256":"c3c05b1df7f6c34db93f64b577d1acdb98d055588db62f92600c3919baafb4f5"}