{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:4FBPJ5J2S5P2I2L3O3KFJNTAIX","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d3b87ada390d1e305b28b6ae7018d69d48f0246804038918ff0c5f69ab4c008b","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-23T04:09:05Z","title_canon_sha256":"cecc86fe479f1354b98dfe0f5492671bcec1bf59b2be1d62e1a2718bffb0cd4b"},"schema_version":"1.0","source":{"id":"2606.24118","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.24118","created_at":"2026-06-24T01:14:41Z"},{"alias_kind":"arxiv_version","alias_value":"2606.24118v1","created_at":"2026-06-24T01:14:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.24118","created_at":"2026-06-24T01:14:41Z"},{"alias_kind":"pith_short_12","alias_value":"4FBPJ5J2S5P2","created_at":"2026-06-24T01:14:41Z"},{"alias_kind":"pith_short_16","alias_value":"4FBPJ5J2S5P2I2L3","created_at":"2026-06-24T01:14:41Z"},{"alias_kind":"pith_short_8","alias_value":"4FBPJ5J2","created_at":"2026-06-24T01:14:41Z"}],"graph_snapshots":[{"event_id":"sha256:2b410ac5ae4eba0e1d5c59b9026efb0182d7b45ea2dc67c50e51c7ea9932cd61","target":"graph","created_at":"2026-06-24T01:14:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.24118/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Visual grounding in documents is a crucial ability for Large Multimodal Models (LMMs) in areas such as document understanding, deep research and document error detection. However, existing approaches exhibit poor grounding precision in text-rich document images, often failing to accurately locate the critical document elements needed for reliable reasoning. To address this gap, we introduce PreciseDoc, an LMM specifically designed for precise element grounding and can be further optimized for Document VQA tasks. Specifically, to enhance the basic localization capability, we construct challengi","authors_text":"Chuangxin Zhao, Ji Qi, Juanzi Li, Kai Sun, Lei Hou, Yijian Lu","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-23T04:09:05Z","title":"An LMM for Precisely Grounding Elements in Documents"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.24118","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:6c5bb4fd82a40d630eec752b9419a9b4d4793935f361e18112008e87f490c092","target":"record","created_at":"2026-06-24T01:14:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d3b87ada390d1e305b28b6ae7018d69d48f0246804038918ff0c5f69ab4c008b","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-23T04:09:05Z","title_canon_sha256":"cecc86fe479f1354b98dfe0f5492671bcec1bf59b2be1d62e1a2718bffb0cd4b"},"schema_version":"1.0","source":{"id":"2606.24118","kind":"arxiv","version":1}},"canonical_sha256":"e142f4f53a975fa4697b76d454b66045fb38e159c610177fe7180d8418ab1e91","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e142f4f53a975fa4697b76d454b66045fb38e159c610177fe7180d8418ab1e91","first_computed_at":"2026-06-24T01:14:41.564450Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-24T01:14:41.564450Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"daBmkUA9kCUPiA8SevfZz9m2i8o5yP+k4o+7ZyOK0mZ9q/lfDYiHnHWbGmWDRbIT8dt/8/w6sLPPjAs5p0tbDQ==","signature_status":"signed_v1","signed_at":"2026-06-24T01:14:41.564811Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.24118","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:6c5bb4fd82a40d630eec752b9419a9b4d4793935f361e18112008e87f490c092","sha256:2b410ac5ae4eba0e1d5c59b9026efb0182d7b45ea2dc67c50e51c7ea9932cd61"],"state_sha256":"aa63b2644f680fc43bd142bff536e5bcf20f994831bde29a51aac3766fe5d812"}