{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:K67DYZLM5XWFC5DKCLOZB42H6R","short_pith_number":"pith:K67DYZLM","canonical_record":{"source":{"id":"1705.08154","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.IR","submitted_at":"2017-05-23T09:36:41Z","cross_cats_sorted":["cs.DL"],"title_canon_sha256":"24df58789c641815ca7bbd4f19c05ed8fa0a554f115bdc015d07dbb55c62bcda","abstract_canon_sha256":"e8ae88b21f94adc1b0f912a781748b70b287dc682e52716d757783a26a77128f"},"schema_version":"1.0"},"canonical_sha256":"57be3c656cedec51746a12dd90f347f45e63b91891fe1674f32386620448bb39","source":{"kind":"arxiv","id":"1705.08154","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1705.08154","created_at":"2026-05-18T00:43:49Z"},{"alias_kind":"arxiv_version","alias_value":"1705.08154v1","created_at":"2026-05-18T00:43:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1705.08154","created_at":"2026-05-18T00:43:49Z"},{"alias_kind":"pith_short_12","alias_value":"K67DYZLM5XWF","created_at":"2026-05-18T12:31:24Z"},{"alias_kind":"pith_short_16","alias_value":"K67DYZLM5XWFC5DK","created_at":"2026-05-18T12:31:24Z"},{"alias_kind":"pith_short_8","alias_value":"K67DYZLM","created_at":"2026-05-18T12:31:24Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:K67DYZLM5XWFC5DKCLOZB42H6R","target":"record","payload":{"canonical_record":{"source":{"id":"1705.08154","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.IR","submitted_at":"2017-05-23T09:36:41Z","cross_cats_sorted":["cs.DL"],"title_canon_sha256":"24df58789c641815ca7bbd4f19c05ed8fa0a554f115bdc015d07dbb55c62bcda","abstract_canon_sha256":"e8ae88b21f94adc1b0f912a781748b70b287dc682e52716d757783a26a77128f"},"schema_version":"1.0"},"canonical_sha256":"57be3c656cedec51746a12dd90f347f45e63b91891fe1674f32386620448bb39","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:43:49.195219Z","signature_b64":"+0ZfQuBHSLe7zSh5UzEVTsfKZcsXFL1+neUYK+W57L0K/ttaUp5E7w/j9vsepEWNXtKQpgtdYKvMX+s6IF1ADg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"57be3c656cedec51746a12dd90f347f45e63b91891fe1674f32386620448bb39","last_reissued_at":"2026-05-18T00:43:49.194597Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:43:49.194597Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1705.08154","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:43:49Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"RNHJ7vpBB3JAmGbIelee/BBtVBnI+dfgRlZNdGYvNTdhj+CaqZYLv2F+tFrMok0PJsGpN344lEcmaFet9aRmAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T15:27:26.651146Z"},"content_sha256":"f2c1dcbbf59e9fb38f0822f1871f07286f49495d87c3462f29b350915f5b3017","schema_version":"1.0","event_id":"sha256:f2c1dcbbf59e9fb38f0822f1871f07286f49495d87c3462f29b350915f5b3017"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:K67DYZLM5XWFC5DKCLOZB42H6R","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Reference String Extraction Using Line-Based Conditional Random Fields","license":"http://creativecommons.org/licenses/by-sa/4.0/","headline":"","cross_cats":["cs.DL"],"primary_cat":"cs.IR","authors_text":"Martin K\\\"orner","submitted_at":"2017-05-23T09:36:41Z","abstract_excerpt":"The extraction of individual reference strings from the reference section of scientific publications is an important step in the citation extraction pipeline. Current approaches divide this task into two steps by first detecting the reference section areas and then grouping the text lines in such areas into reference strings. We propose a classification model that considers every line in a publication as a potential part of a reference string. By applying line-based conditional random fields rather than constructing the graphical model based on the individual words, dependencies and patterns t"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1705.08154","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:43:49Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"MlAKI51RpXDWItezr7yebioNHTGuCybdlSdjuPyLK1f4mKCR87vRgZn1F0MHDpXjp9fSoMQs8BYpHYJnyzUeDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T15:27:26.651570Z"},"content_sha256":"07809099dcc5c411f2b797f5222f758e470c93d1d0b6420935fb5bf5462e83a8","schema_version":"1.0","event_id":"sha256:07809099dcc5c411f2b797f5222f758e470c93d1d0b6420935fb5bf5462e83a8"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/K67DYZLM5XWFC5DKCLOZB42H6R/bundle.json","state_url":"https://pith.science/pith/K67DYZLM5XWFC5DKCLOZB42H6R/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/K67DYZLM5XWFC5DKCLOZB42H6R/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-04T15:27:26Z","links":{"resolver":"https://pith.science/pith/K67DYZLM5XWFC5DKCLOZB42H6R","bundle":"https://pith.science/pith/K67DYZLM5XWFC5DKCLOZB42H6R/bundle.json","state":"https://pith.science/pith/K67DYZLM5XWFC5DKCLOZB42H6R/state.json","well_known_bundle":"https://pith.science/.well-known/pith/K67DYZLM5XWFC5DKCLOZB42H6R/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:K67DYZLM5XWFC5DKCLOZB42H6R","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e8ae88b21f94adc1b0f912a781748b70b287dc682e52716d757783a26a77128f","cross_cats_sorted":["cs.DL"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.IR","submitted_at":"2017-05-23T09:36:41Z","title_canon_sha256":"24df58789c641815ca7bbd4f19c05ed8fa0a554f115bdc015d07dbb55c62bcda"},"schema_version":"1.0","source":{"id":"1705.08154","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1705.08154","created_at":"2026-05-18T00:43:49Z"},{"alias_kind":"arxiv_version","alias_value":"1705.08154v1","created_at":"2026-05-18T00:43:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1705.08154","created_at":"2026-05-18T00:43:49Z"},{"alias_kind":"pith_short_12","alias_value":"K67DYZLM5XWF","created_at":"2026-05-18T12:31:24Z"},{"alias_kind":"pith_short_16","alias_value":"K67DYZLM5XWFC5DK","created_at":"2026-05-18T12:31:24Z"},{"alias_kind":"pith_short_8","alias_value":"K67DYZLM","created_at":"2026-05-18T12:31:24Z"}],"graph_snapshots":[{"event_id":"sha256:07809099dcc5c411f2b797f5222f758e470c93d1d0b6420935fb5bf5462e83a8","target":"graph","created_at":"2026-05-18T00:43:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The extraction of individual reference strings from the reference section of scientific publications is an important step in the citation extraction pipeline. Current approaches divide this task into two steps by first detecting the reference section areas and then grouping the text lines in such areas into reference strings. We propose a classification model that considers every line in a publication as a potential part of a reference string. By applying line-based conditional random fields rather than constructing the graphical model based on the individual words, dependencies and patterns t","authors_text":"Martin K\\\"orner","cross_cats":["cs.DL"],"headline":"","license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.IR","submitted_at":"2017-05-23T09:36:41Z","title":"Reference String Extraction Using Line-Based Conditional Random Fields"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1705.08154","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:f2c1dcbbf59e9fb38f0822f1871f07286f49495d87c3462f29b350915f5b3017","target":"record","created_at":"2026-05-18T00:43:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e8ae88b21f94adc1b0f912a781748b70b287dc682e52716d757783a26a77128f","cross_cats_sorted":["cs.DL"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.IR","submitted_at":"2017-05-23T09:36:41Z","title_canon_sha256":"24df58789c641815ca7bbd4f19c05ed8fa0a554f115bdc015d07dbb55c62bcda"},"schema_version":"1.0","source":{"id":"1705.08154","kind":"arxiv","version":1}},"canonical_sha256":"57be3c656cedec51746a12dd90f347f45e63b91891fe1674f32386620448bb39","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"57be3c656cedec51746a12dd90f347f45e63b91891fe1674f32386620448bb39","first_computed_at":"2026-05-18T00:43:49.194597Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:43:49.194597Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"+0ZfQuBHSLe7zSh5UzEVTsfKZcsXFL1+neUYK+W57L0K/ttaUp5E7w/j9vsepEWNXtKQpgtdYKvMX+s6IF1ADg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:43:49.195219Z","signed_message":"canonical_sha256_bytes"},"source_id":"1705.08154","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:f2c1dcbbf59e9fb38f0822f1871f07286f49495d87c3462f29b350915f5b3017","sha256:07809099dcc5c411f2b797f5222f758e470c93d1d0b6420935fb5bf5462e83a8"],"state_sha256":"64a754c118efbdf3ee9da80314ec5fb9436511fbe1382b5220115f8b71e21542"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kR7QKgdxQQ77Dsb8dT64T/qRuqUuaQzzbalfylbRkZxWDLSFEcQErEX9TvtzSKSqowjta7ty0OoOI5pNlNKOCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-04T15:27:26.653747Z","bundle_sha256":"9f9422060020b0d2482456722713bea6a5b4b06d3268d1c6f9c76022e8e63033"}}