{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:YL73JPKXWGULTLS3EUPKO2JHOA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"c78484ee8ced273c7113b3c1df7d99a9b644ac9b52d1ac5b0bb456cac97a64e8","cross_cats_sorted":["cs.CV"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-05-22T04:41:37Z","title_canon_sha256":"43b270479da20916f0b44e7321bae7be2d4aa81f85c9b42f2c5659a59f5c435f"},"schema_version":"1.0","source":{"id":"1805.08389","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1805.08389","created_at":"2026-05-18T00:15:26Z"},{"alias_kind":"arxiv_version","alias_value":"1805.08389v1","created_at":"2026-05-18T00:15:26Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1805.08389","created_at":"2026-05-18T00:15:26Z"},{"alias_kind":"pith_short_12","alias_value":"YL73JPKXWGUL","created_at":"2026-05-18T12:33:04Z"},{"alias_kind":"pith_short_16","alias_value":"YL73JPKXWGULTLS3","created_at":"2026-05-18T12:33:04Z"},{"alias_kind":"pith_short_8","alias_value":"YL73JPKX","created_at":"2026-05-18T12:33:04Z"}],"graph_snapshots":[{"event_id":"sha256:a12ef7a8caee41e9d735269dd85f541e1df8df278977fcecc15f0c37198cae0f","target":"graph","created_at":"2026-05-18T00:15:26Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Answering visual questions need acquire daily common knowledge and model the semantic connection among different parts in images, which is too difficult for VQA systems to learn from images with the only supervision from answers. Meanwhile, image captioning systems with beam search strategy tend to generate similar captions and fail to diversely describe images. To address the aforementioned issues, we present a system to have these two tasks compensate with each other, which is capable of jointly producing image captions and answering visual questions. In particular, we utilize question and i","authors_text":"Jialin Wu, Raymond J. Mooney, Zeyuan Hu","cross_cats":["cs.CV"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-05-22T04:41:37Z","title":"Joint Image Captioning and Question Answering"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1805.08389","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0beb306da0c5bbeaf75391f32a70fa74eb2922281105e34d30dd3bfb80a20d3e","target":"record","created_at":"2026-05-18T00:15:26Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"c78484ee8ced273c7113b3c1df7d99a9b644ac9b52d1ac5b0bb456cac97a64e8","cross_cats_sorted":["cs.CV"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-05-22T04:41:37Z","title_canon_sha256":"43b270479da20916f0b44e7321bae7be2d4aa81f85c9b42f2c5659a59f5c435f"},"schema_version":"1.0","source":{"id":"1805.08389","kind":"arxiv","version":1}},"canonical_sha256":"c2ffb4bd57b1a8b9ae5b251ea7692770128cb1646f1c40df16e221f397f5b3d3","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c2ffb4bd57b1a8b9ae5b251ea7692770128cb1646f1c40df16e221f397f5b3d3","first_computed_at":"2026-05-18T00:15:26.680224Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:15:26.680224Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"d5Z50t7TYrNAnkAUV4bDQFLiQK+abmyKxWWIxBQnPANoMn8iN72RIbaiGJqkEXlbLf1ijlYxUGmaCe7xMUwKCg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:15:26.681129Z","signed_message":"canonical_sha256_bytes"},"source_id":"1805.08389","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0beb306da0c5bbeaf75391f32a70fa74eb2922281105e34d30dd3bfb80a20d3e","sha256:a12ef7a8caee41e9d735269dd85f541e1df8df278977fcecc15f0c37198cae0f"],"state_sha256":"98671e27a90d7e320c2a223359c6992413d652d0d091d0cf8a857757e3ea9091"}