{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:AKPT4QRHCFVF5H3ZYHEHZ5FAXF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4f018b4ff56fd919ed8d58c841d4b246300ccca637c7e9757bc886dfcb16230a","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-25T12:00:45Z","title_canon_sha256":"ffed647fbea39eca8e1248902e40ed0052780bcf88b49ec6bf4dde5805423fc0"},"schema_version":"1.0","source":{"id":"2606.26923","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.26923","created_at":"2026-06-26T01:16:04Z"},{"alias_kind":"arxiv_version","alias_value":"2606.26923v1","created_at":"2026-06-26T01:16:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.26923","created_at":"2026-06-26T01:16:04Z"},{"alias_kind":"pith_short_12","alias_value":"AKPT4QRHCFVF","created_at":"2026-06-26T01:16:04Z"},{"alias_kind":"pith_short_16","alias_value":"AKPT4QRHCFVF5H3Z","created_at":"2026-06-26T01:16:04Z"},{"alias_kind":"pith_short_8","alias_value":"AKPT4QRH","created_at":"2026-06-26T01:16:04Z"}],"graph_snapshots":[{"event_id":"sha256:2c5bc541f2f5a150d4c5e1eb37e3010c089435b535eafac5c20fc7c17eb645e8","target":"graph","created_at":"2026-06-26T01:16:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.26923/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Vision-language models (VLMs) often produce hallucinated or inconsistent outputs, where text and images are not properly aligned. Addressing this issue requires not only detecting misalignment but also explaining the discrepancy and localizing its visual evidence. We introduce GAVEL (Grounded Caption Error Verification and Localization), a task that jointly addresses verification, explanation, and localization for image-text pairs. To support systematic evaluation, we also present a corresponding dataset and benchmark. We further train a supervised baseline on the human-annotated training spli","authors_text":"Atsushi Hashimoto, Kuniaki Saito, Zixian Gao","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-25T12:00:45Z","title":"GAVEL: Grounded Caption Error Verification and Localization"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.26923","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:62f2221ed2ba51eaaa9d34d12771a31d693d80ee6dbc8bd04ace1c4d583a5555","target":"record","created_at":"2026-06-26T01:16:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4f018b4ff56fd919ed8d58c841d4b246300ccca637c7e9757bc886dfcb16230a","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-25T12:00:45Z","title_canon_sha256":"ffed647fbea39eca8e1248902e40ed0052780bcf88b49ec6bf4dde5805423fc0"},"schema_version":"1.0","source":{"id":"2606.26923","kind":"arxiv","version":1}},"canonical_sha256":"029f3e4227116a5e9f79c1c87cf4a0b9752234a6b90619e2f97d52eb8d57c69d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"029f3e4227116a5e9f79c1c87cf4a0b9752234a6b90619e2f97d52eb8d57c69d","first_computed_at":"2026-06-26T01:16:04.212758Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-26T01:16:04.212758Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Gp/C5FEJqEHt2Kym/YKU83NOXBKL9mcy49ciR294SPPeQuTJdENaBpM5mrnz00dsvr0waR1b0que6abP0CBqAA==","signature_status":"signed_v1","signed_at":"2026-06-26T01:16:04.213154Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.26923","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:62f2221ed2ba51eaaa9d34d12771a31d693d80ee6dbc8bd04ace1c4d583a5555","sha256:2c5bc541f2f5a150d4c5e1eb37e3010c089435b535eafac5c20fc7c17eb645e8"],"state_sha256":"6f99e15eebf39d1f13c7a8d69fe158c49809a40387638d56e19844e6efbaff4e"}