{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:R7EGEVLGK463WXZX75EOBHEWRC","short_pith_number":"pith:R7EGEVLG","canonical_record":{"source":{"id":"1904.01655","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.QM","submitted_at":"2019-04-02T20:27:42Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"e82b9c984be3d90c152b2423da3b0658e941c51f17f01965ad465754ffc6b253","abstract_canon_sha256":"98cf058437a977afd9cddfe73c7468d8a8441dee8121b638960d3b932d1267de"},"schema_version":"1.0"},"canonical_sha256":"8fc8625566573dbb5f37ff48e09c96888ddf1ebdbc03765b68850f1420861954","source":{"kind":"arxiv","id":"1904.01655","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1904.01655","created_at":"2026-05-17T23:49:30Z"},{"alias_kind":"arxiv_version","alias_value":"1904.01655v1","created_at":"2026-05-17T23:49:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1904.01655","created_at":"2026-05-17T23:49:30Z"},{"alias_kind":"pith_short_12","alias_value":"R7EGEVLGK463","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_16","alias_value":"R7EGEVLGK463WXZX","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_8","alias_value":"R7EGEVLG","created_at":"2026-05-18T12:33:27Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:R7EGEVLGK463WXZX75EOBHEWRC","target":"record","payload":{"canonical_record":{"source":{"id":"1904.01655","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.QM","submitted_at":"2019-04-02T20:27:42Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"e82b9c984be3d90c152b2423da3b0658e941c51f17f01965ad465754ffc6b253","abstract_canon_sha256":"98cf058437a977afd9cddfe73c7468d8a8441dee8121b638960d3b932d1267de"},"schema_version":"1.0"},"canonical_sha256":"8fc8625566573dbb5f37ff48e09c96888ddf1ebdbc03765b68850f1420861954","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:49:30.352986Z","signature_b64":"eIQqryPHYYtxi72wrhYq/5IK1rWQaqjv49b8OZID7HMVtc0l8NCDBJtXuR/0q47zqIoLCBY7CruD5Xv9lOphCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8fc8625566573dbb5f37ff48e09c96888ddf1ebdbc03765b68850f1420861954","last_reissued_at":"2026-05-17T23:49:30.352281Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:49:30.352281Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1904.01655","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:49:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/ythV8ISQdkw/qkAU6vXCPHLYAninTW6o55HfT8K+6zL5oh8xOUk27axhgpO4r/J0+rsKBSRui1KlEtLKsQ1Aw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-27T22:04:41.265245Z"},"content_sha256":"13752260ad9c3eb5943c44d5cf8df0c5ed573e77720645374a4b4516885faf2b","schema_version":"1.0","event_id":"sha256:13752260ad9c3eb5943c44d5cf8df0c5ed573e77720645374a4b4516885faf2b"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:R7EGEVLGK463WXZX75EOBHEWRC","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"A frame semantic overview of NLP-based information extraction for cancer-related EHR notes","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL"],"primary_cat":"q-bio.QM","authors_text":"Elmer V Bernstam, Kirk Roberts, Surabhi Datta","submitted_at":"2019-04-02T20:27:42Z","abstract_excerpt":"Objective: There is a lot of information about cancer in Electronic Health Record (EHR) notes that can be useful for biomedical research provided natural language processing (NLP) methods are available to extract and structure this information. In this paper, we present a scoping review of existing clinical NLP literature for cancer. Methods: We identified studies describing an NLP method to extract specific cancer-related information from EHR sources from PubMed, Google Scholar, ACL Anthology, and existing reviews. Two exclusion criteria were used in this study. We excluded articles where the"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1904.01655","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:49:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"yvBCWVB/5jw4EEcc314nHnSdobUI+rvO9ztFCmq+v4fdtpugNDfbd9FqnGZBUftMzbaQ5GBF1FeGhSjhu3W9Dw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-27T22:04:41.265606Z"},"content_sha256":"6099ee8ea7a619ade78be56f879195ef55f9d5a4f6dcb65c96fe26620aada15a","schema_version":"1.0","event_id":"sha256:6099ee8ea7a619ade78be56f879195ef55f9d5a4f6dcb65c96fe26620aada15a"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/R7EGEVLGK463WXZX75EOBHEWRC/bundle.json","state_url":"https://pith.science/pith/R7EGEVLGK463WXZX75EOBHEWRC/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/R7EGEVLGK463WXZX75EOBHEWRC/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-27T22:04:41Z","links":{"resolver":"https://pith.science/pith/R7EGEVLGK463WXZX75EOBHEWRC","bundle":"https://pith.science/pith/R7EGEVLGK463WXZX75EOBHEWRC/bundle.json","state":"https://pith.science/pith/R7EGEVLGK463WXZX75EOBHEWRC/state.json","well_known_bundle":"https://pith.science/.well-known/pith/R7EGEVLGK463WXZX75EOBHEWRC/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:R7EGEVLGK463WXZX75EOBHEWRC","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"98cf058437a977afd9cddfe73c7468d8a8441dee8121b638960d3b932d1267de","cross_cats_sorted":["cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.QM","submitted_at":"2019-04-02T20:27:42Z","title_canon_sha256":"e82b9c984be3d90c152b2423da3b0658e941c51f17f01965ad465754ffc6b253"},"schema_version":"1.0","source":{"id":"1904.01655","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1904.01655","created_at":"2026-05-17T23:49:30Z"},{"alias_kind":"arxiv_version","alias_value":"1904.01655v1","created_at":"2026-05-17T23:49:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1904.01655","created_at":"2026-05-17T23:49:30Z"},{"alias_kind":"pith_short_12","alias_value":"R7EGEVLGK463","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_16","alias_value":"R7EGEVLGK463WXZX","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_8","alias_value":"R7EGEVLG","created_at":"2026-05-18T12:33:27Z"}],"graph_snapshots":[{"event_id":"sha256:6099ee8ea7a619ade78be56f879195ef55f9d5a4f6dcb65c96fe26620aada15a","target":"graph","created_at":"2026-05-17T23:49:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Objective: There is a lot of information about cancer in Electronic Health Record (EHR) notes that can be useful for biomedical research provided natural language processing (NLP) methods are available to extract and structure this information. In this paper, we present a scoping review of existing clinical NLP literature for cancer. Methods: We identified studies describing an NLP method to extract specific cancer-related information from EHR sources from PubMed, Google Scholar, ACL Anthology, and existing reviews. Two exclusion criteria were used in this study. We excluded articles where the","authors_text":"Elmer V Bernstam, Kirk Roberts, Surabhi Datta","cross_cats":["cs.CL"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.QM","submitted_at":"2019-04-02T20:27:42Z","title":"A frame semantic overview of NLP-based information extraction for cancer-related EHR notes"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1904.01655","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:13752260ad9c3eb5943c44d5cf8df0c5ed573e77720645374a4b4516885faf2b","target":"record","created_at":"2026-05-17T23:49:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"98cf058437a977afd9cddfe73c7468d8a8441dee8121b638960d3b932d1267de","cross_cats_sorted":["cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.QM","submitted_at":"2019-04-02T20:27:42Z","title_canon_sha256":"e82b9c984be3d90c152b2423da3b0658e941c51f17f01965ad465754ffc6b253"},"schema_version":"1.0","source":{"id":"1904.01655","kind":"arxiv","version":1}},"canonical_sha256":"8fc8625566573dbb5f37ff48e09c96888ddf1ebdbc03765b68850f1420861954","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8fc8625566573dbb5f37ff48e09c96888ddf1ebdbc03765b68850f1420861954","first_computed_at":"2026-05-17T23:49:30.352281Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:49:30.352281Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"eIQqryPHYYtxi72wrhYq/5IK1rWQaqjv49b8OZID7HMVtc0l8NCDBJtXuR/0q47zqIoLCBY7CruD5Xv9lOphCg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:49:30.352986Z","signed_message":"canonical_sha256_bytes"},"source_id":"1904.01655","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:13752260ad9c3eb5943c44d5cf8df0c5ed573e77720645374a4b4516885faf2b","sha256:6099ee8ea7a619ade78be56f879195ef55f9d5a4f6dcb65c96fe26620aada15a"],"state_sha256":"6c0852320baedb77c03a053858422730ac1701e1bd533c5e53717b7387256aa3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"SGbjnW9LrAZP5lWNcyZJT+uXCK4YHZkGIG9FruN+0yMb35cXPMLTklbmaLYZIA7fQy+IsHlte+3SX9cPNyGnDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-27T22:04:41.267442Z","bundle_sha256":"90f480fba7f7adff066fdf432354f44eedff8f1e4038228347a1612a421674b2"}}