{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:JWNFNHVVI6VJKTJOU3Q3GQDI4G","short_pith_number":"pith:JWNFNHVV","canonical_record":{"source":{"id":"1711.04411","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-11-13T03:47:52Z","cross_cats_sorted":[],"title_canon_sha256":"ced2840338d0d6680c08f0471311c6ad446550b5381bdaa12d01a186c0527184","abstract_canon_sha256":"659ca988e34b076927dc527ca55ff55dc6aca609f1ba8f845f0b20d99dde8f9b"},"schema_version":"1.0"},"canonical_sha256":"4d9a569eb547aa954d2ea6e1b34068e1ae749d46d1479660724c4cbc8f38cabe","source":{"kind":"arxiv","id":"1711.04411","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1711.04411","created_at":"2026-05-18T00:30:39Z"},{"alias_kind":"arxiv_version","alias_value":"1711.04411v1","created_at":"2026-05-18T00:30:39Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1711.04411","created_at":"2026-05-18T00:30:39Z"},{"alias_kind":"pith_short_12","alias_value":"JWNFNHVVI6VJ","created_at":"2026-05-18T12:31:24Z"},{"alias_kind":"pith_short_16","alias_value":"JWNFNHVVI6VJKTJO","created_at":"2026-05-18T12:31:24Z"},{"alias_kind":"pith_short_8","alias_value":"JWNFNHVV","created_at":"2026-05-18T12:31:24Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:JWNFNHVVI6VJKTJOU3Q3GQDI4G","target":"record","payload":{"canonical_record":{"source":{"id":"1711.04411","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-11-13T03:47:52Z","cross_cats_sorted":[],"title_canon_sha256":"ced2840338d0d6680c08f0471311c6ad446550b5381bdaa12d01a186c0527184","abstract_canon_sha256":"659ca988e34b076927dc527ca55ff55dc6aca609f1ba8f845f0b20d99dde8f9b"},"schema_version":"1.0"},"canonical_sha256":"4d9a569eb547aa954d2ea6e1b34068e1ae749d46d1479660724c4cbc8f38cabe","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:30:39.123434Z","signature_b64":"N8YfRhhJ1dB8aOfJ9Yk/sPWeUz81G6SVYTbUL7j0EyU2FZbpzYSkV4CMQuv1QuEuI8OcYnca55f44nksDS98BQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4d9a569eb547aa954d2ea6e1b34068e1ae749d46d1479660724c4cbc8f38cabe","last_reissued_at":"2026-05-18T00:30:39.122766Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:30:39.122766Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1711.04411","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:30:39Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"i8HW9FPey2a/bQi/33wKMKZKZNxcozE3XzHwh8gq+viv1iBMpCbEiIAkUtA44Rxgcdpzl24ECo1mQGILLo/nDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-05T19:08:50.688127Z"},"content_sha256":"ec67c348d97c6a20b81306eb24b44db317bdd42493e50341885d6e0ee4a9b70d","schema_version":"1.0","event_id":"sha256:ec67c348d97c6a20b81306eb24b44db317bdd42493e50341885d6e0ee4a9b70d"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:JWNFNHVVI6VJKTJOU3Q3GQDI4G","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Convolutional Neural Network with Word Embeddings for Chinese Word Segmentation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Bo Xu, Chunqi Wang","submitted_at":"2017-11-13T03:47:52Z","abstract_excerpt":"Character-based sequence labeling framework is flexible and efficient for Chinese word segmentation (CWS). Recently, many character-based neural models have been applied to CWS. While they obtain good performance, they have two obvious weaknesses. The first is that they heavily rely on manually designed bigram feature, i.e. they are not good at capturing n-gram features automatically. The second is that they make no use of full word information. For the first weakness, we propose a convolutional neural model, which is able to capture rich n-gram features without any feature engineering. For th"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1711.04411","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:30:39Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"KQZs8A3OyGTn6atHtvmXUymBcOQdK8CTp4FueNBAL7VRCUpPOouyoQzHveepbhbiiFob9QErpkM6D1PBnqhLDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-05T19:08:50.688761Z"},"content_sha256":"2b2453e0dc9cf834647bd142ae44ef52eef9cc4344b54623a06214c31124f2f4","schema_version":"1.0","event_id":"sha256:2b2453e0dc9cf834647bd142ae44ef52eef9cc4344b54623a06214c31124f2f4"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/JWNFNHVVI6VJKTJOU3Q3GQDI4G/bundle.json","state_url":"https://pith.science/pith/JWNFNHVVI6VJKTJOU3Q3GQDI4G/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/JWNFNHVVI6VJKTJOU3Q3GQDI4G/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-05T19:08:50Z","links":{"resolver":"https://pith.science/pith/JWNFNHVVI6VJKTJOU3Q3GQDI4G","bundle":"https://pith.science/pith/JWNFNHVVI6VJKTJOU3Q3GQDI4G/bundle.json","state":"https://pith.science/pith/JWNFNHVVI6VJKTJOU3Q3GQDI4G/state.json","well_known_bundle":"https://pith.science/.well-known/pith/JWNFNHVVI6VJKTJOU3Q3GQDI4G/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:JWNFNHVVI6VJKTJOU3Q3GQDI4G","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"659ca988e34b076927dc527ca55ff55dc6aca609f1ba8f845f0b20d99dde8f9b","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-11-13T03:47:52Z","title_canon_sha256":"ced2840338d0d6680c08f0471311c6ad446550b5381bdaa12d01a186c0527184"},"schema_version":"1.0","source":{"id":"1711.04411","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1711.04411","created_at":"2026-05-18T00:30:39Z"},{"alias_kind":"arxiv_version","alias_value":"1711.04411v1","created_at":"2026-05-18T00:30:39Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1711.04411","created_at":"2026-05-18T00:30:39Z"},{"alias_kind":"pith_short_12","alias_value":"JWNFNHVVI6VJ","created_at":"2026-05-18T12:31:24Z"},{"alias_kind":"pith_short_16","alias_value":"JWNFNHVVI6VJKTJO","created_at":"2026-05-18T12:31:24Z"},{"alias_kind":"pith_short_8","alias_value":"JWNFNHVV","created_at":"2026-05-18T12:31:24Z"}],"graph_snapshots":[{"event_id":"sha256:2b2453e0dc9cf834647bd142ae44ef52eef9cc4344b54623a06214c31124f2f4","target":"graph","created_at":"2026-05-18T00:30:39Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Character-based sequence labeling framework is flexible and efficient for Chinese word segmentation (CWS). Recently, many character-based neural models have been applied to CWS. While they obtain good performance, they have two obvious weaknesses. The first is that they heavily rely on manually designed bigram feature, i.e. they are not good at capturing n-gram features automatically. The second is that they make no use of full word information. For the first weakness, we propose a convolutional neural model, which is able to capture rich n-gram features without any feature engineering. For th","authors_text":"Bo Xu, Chunqi Wang","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-11-13T03:47:52Z","title":"Convolutional Neural Network with Word Embeddings for Chinese Word Segmentation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1711.04411","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ec67c348d97c6a20b81306eb24b44db317bdd42493e50341885d6e0ee4a9b70d","target":"record","created_at":"2026-05-18T00:30:39Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"659ca988e34b076927dc527ca55ff55dc6aca609f1ba8f845f0b20d99dde8f9b","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-11-13T03:47:52Z","title_canon_sha256":"ced2840338d0d6680c08f0471311c6ad446550b5381bdaa12d01a186c0527184"},"schema_version":"1.0","source":{"id":"1711.04411","kind":"arxiv","version":1}},"canonical_sha256":"4d9a569eb547aa954d2ea6e1b34068e1ae749d46d1479660724c4cbc8f38cabe","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4d9a569eb547aa954d2ea6e1b34068e1ae749d46d1479660724c4cbc8f38cabe","first_computed_at":"2026-05-18T00:30:39.122766Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:30:39.122766Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"N8YfRhhJ1dB8aOfJ9Yk/sPWeUz81G6SVYTbUL7j0EyU2FZbpzYSkV4CMQuv1QuEuI8OcYnca55f44nksDS98BQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:30:39.123434Z","signed_message":"canonical_sha256_bytes"},"source_id":"1711.04411","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ec67c348d97c6a20b81306eb24b44db317bdd42493e50341885d6e0ee4a9b70d","sha256:2b2453e0dc9cf834647bd142ae44ef52eef9cc4344b54623a06214c31124f2f4"],"state_sha256":"4397fa7c9b959a6df61650249a381e66bca71391941c8e348914d6fbd52eaa04"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kOS5xSRoIYBAJDMut1jGHnu8CkjX+UmCshxCfJNBN7nKTdS5LMO4LqNPiez/c5+mlzX7eusQbx3FZYQSOxjhBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-05T19:08:50.692018Z","bundle_sha256":"cf1f05bd695ca0981b2049e419a185b4227664ae5a911583816bc406223be826"}}