{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:6ECJ74ASL4PIDGBCPWBHQEOYUF","short_pith_number":"pith:6ECJ74AS","canonical_record":{"source":{"id":"1612.00576","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-02T06:50:49Z","cross_cats_sorted":[],"title_canon_sha256":"2286c7547cd9e178ba6f8841562fe863e13a56e3822adb20765c05e4a7bb9167","abstract_canon_sha256":"fdf81c2d607faceef0b292b4ab0ce934df9d5352cf95753d6731d0edb94a4d75"},"schema_version":"1.0"},"canonical_sha256":"f1049ff0125f1e8198227d827811d8a15e353b1cc046f59eb4bc1272b54579d5","source":{"kind":"arxiv","id":"1612.00576","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1612.00576","created_at":"2026-05-18T00:39:56Z"},{"alias_kind":"arxiv_version","alias_value":"1612.00576v2","created_at":"2026-05-18T00:39:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1612.00576","created_at":"2026-05-18T00:39:56Z"},{"alias_kind":"pith_short_12","alias_value":"6ECJ74ASL4PI","created_at":"2026-05-18T12:30:01Z"},{"alias_kind":"pith_short_16","alias_value":"6ECJ74ASL4PIDGBC","created_at":"2026-05-18T12:30:01Z"},{"alias_kind":"pith_short_8","alias_value":"6ECJ74AS","created_at":"2026-05-18T12:30:01Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:6ECJ74ASL4PIDGBCPWBHQEOYUF","target":"record","payload":{"canonical_record":{"source":{"id":"1612.00576","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-02T06:50:49Z","cross_cats_sorted":[],"title_canon_sha256":"2286c7547cd9e178ba6f8841562fe863e13a56e3822adb20765c05e4a7bb9167","abstract_canon_sha256":"fdf81c2d607faceef0b292b4ab0ce934df9d5352cf95753d6731d0edb94a4d75"},"schema_version":"1.0"},"canonical_sha256":"f1049ff0125f1e8198227d827811d8a15e353b1cc046f59eb4bc1272b54579d5","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:39:56.836611Z","signature_b64":"Sl39iYEfNaZ0c9hB4RXNM/uth1B9Br3g0wDBPVMSGLjdOk8n+dHCIZLoA5uf6Zb7gjbYwRFIcLD3mNmJuGxVDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f1049ff0125f1e8198227d827811d8a15e353b1cc046f59eb4bc1272b54579d5","last_reissued_at":"2026-05-18T00:39:56.836157Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:39:56.836157Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1612.00576","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:39:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+2Jx0dWz/essb1uXzISREvqme8CqTqZrndKx6+FvRxST6UqQMSnUgrdY+IZFSWTze4Lp1jeitkefcTJQrZbSDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T23:55:03.167715Z"},"content_sha256":"7e2a3998f37463029377cbd32af46b6e001d3ba0a0b54efb8ca12d25a8bebe6f","schema_version":"1.0","event_id":"sha256:7e2a3998f37463029377cbd32af46b6e001d3ba0a0b54efb8ca12d25a8bebe6f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:6ECJ74ASL4PIDGBCPWBHQEOYUF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Guided Open Vocabulary Image Captioning with Constrained Beam Search","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Basura Fernando, Mark Johnson, Peter Anderson, Stephen Gould","submitted_at":"2016-12-02T06:50:49Z","abstract_excerpt":"Existing image captioning models do not generalize well to out-of-domain images containing novel scenes or objects. This limitation severely hinders the use of these models in real world applications dealing with images in the wild. We address this problem using a flexible approach that enables existing deep captioning architectures to take advantage of image taggers at test time, without re-training. Our method uses constrained beam search to force the inclusion of selected tag words in the output, and fixed, pretrained word embeddings to facilitate vocabulary expansion to previously unseen t"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1612.00576","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:39:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"mTUf0HoyCVb3h8jYU7S6AhhgHxR9w96+veOGWzKJWFs/KDOVnRQvD0wBk38sWbrza2pvbK3NMNGvqtZtux1FDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T23:55:03.168460Z"},"content_sha256":"8c855319dea29b7ef9537f1069c594c819318eeec697610607002b81a1a587fc","schema_version":"1.0","event_id":"sha256:8c855319dea29b7ef9537f1069c594c819318eeec697610607002b81a1a587fc"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/6ECJ74ASL4PIDGBCPWBHQEOYUF/bundle.json","state_url":"https://pith.science/pith/6ECJ74ASL4PIDGBCPWBHQEOYUF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/6ECJ74ASL4PIDGBCPWBHQEOYUF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-31T23:55:03Z","links":{"resolver":"https://pith.science/pith/6ECJ74ASL4PIDGBCPWBHQEOYUF","bundle":"https://pith.science/pith/6ECJ74ASL4PIDGBCPWBHQEOYUF/bundle.json","state":"https://pith.science/pith/6ECJ74ASL4PIDGBCPWBHQEOYUF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/6ECJ74ASL4PIDGBCPWBHQEOYUF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:6ECJ74ASL4PIDGBCPWBHQEOYUF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"fdf81c2d607faceef0b292b4ab0ce934df9d5352cf95753d6731d0edb94a4d75","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-02T06:50:49Z","title_canon_sha256":"2286c7547cd9e178ba6f8841562fe863e13a56e3822adb20765c05e4a7bb9167"},"schema_version":"1.0","source":{"id":"1612.00576","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1612.00576","created_at":"2026-05-18T00:39:56Z"},{"alias_kind":"arxiv_version","alias_value":"1612.00576v2","created_at":"2026-05-18T00:39:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1612.00576","created_at":"2026-05-18T00:39:56Z"},{"alias_kind":"pith_short_12","alias_value":"6ECJ74ASL4PI","created_at":"2026-05-18T12:30:01Z"},{"alias_kind":"pith_short_16","alias_value":"6ECJ74ASL4PIDGBC","created_at":"2026-05-18T12:30:01Z"},{"alias_kind":"pith_short_8","alias_value":"6ECJ74AS","created_at":"2026-05-18T12:30:01Z"}],"graph_snapshots":[{"event_id":"sha256:8c855319dea29b7ef9537f1069c594c819318eeec697610607002b81a1a587fc","target":"graph","created_at":"2026-05-18T00:39:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Existing image captioning models do not generalize well to out-of-domain images containing novel scenes or objects. This limitation severely hinders the use of these models in real world applications dealing with images in the wild. We address this problem using a flexible approach that enables existing deep captioning architectures to take advantage of image taggers at test time, without re-training. Our method uses constrained beam search to force the inclusion of selected tag words in the output, and fixed, pretrained word embeddings to facilitate vocabulary expansion to previously unseen t","authors_text":"Basura Fernando, Mark Johnson, Peter Anderson, Stephen Gould","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-02T06:50:49Z","title":"Guided Open Vocabulary Image Captioning with Constrained Beam Search"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1612.00576","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:7e2a3998f37463029377cbd32af46b6e001d3ba0a0b54efb8ca12d25a8bebe6f","target":"record","created_at":"2026-05-18T00:39:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"fdf81c2d607faceef0b292b4ab0ce934df9d5352cf95753d6731d0edb94a4d75","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-02T06:50:49Z","title_canon_sha256":"2286c7547cd9e178ba6f8841562fe863e13a56e3822adb20765c05e4a7bb9167"},"schema_version":"1.0","source":{"id":"1612.00576","kind":"arxiv","version":2}},"canonical_sha256":"f1049ff0125f1e8198227d827811d8a15e353b1cc046f59eb4bc1272b54579d5","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f1049ff0125f1e8198227d827811d8a15e353b1cc046f59eb4bc1272b54579d5","first_computed_at":"2026-05-18T00:39:56.836157Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:39:56.836157Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Sl39iYEfNaZ0c9hB4RXNM/uth1B9Br3g0wDBPVMSGLjdOk8n+dHCIZLoA5uf6Zb7gjbYwRFIcLD3mNmJuGxVDQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:39:56.836611Z","signed_message":"canonical_sha256_bytes"},"source_id":"1612.00576","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:7e2a3998f37463029377cbd32af46b6e001d3ba0a0b54efb8ca12d25a8bebe6f","sha256:8c855319dea29b7ef9537f1069c594c819318eeec697610607002b81a1a587fc"],"state_sha256":"5f182f0e5f887f1380d59db0c326adc042570ead7c25830f40d995e3be716735"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"UGTN7wYXTqzfLZD7JFHcDZ/KP03GDitovn651VQViOUiHF8rpcamQVim1yAVX1E7m/tKTXeGtFzdEDSU3YD8Bw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-31T23:55:03.172097Z","bundle_sha256":"3c00f783712d02cfb42797b8da2d331a8950ed75f7b97f7acae22e340cc8415b"}}