{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:DMT6MKATDZLHMXOSM4GUNHCBGM","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e728cbcb6b07c27b48723db598e1a190be674b3ce401ac8f1915eedd4d92c35f","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-03-09T09:46:56Z","title_canon_sha256":"3e8eb13e1a9181a41e5fd7cec849da5081a34d3af3a0a5a7b35fcc88ea2451b9"},"schema_version":"1.0","source":{"id":"1703.03200","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1703.03200","created_at":"2026-05-18T00:48:59Z"},{"alias_kind":"arxiv_version","alias_value":"1703.03200v2","created_at":"2026-05-18T00:48:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1703.03200","created_at":"2026-05-18T00:48:59Z"},{"alias_kind":"pith_short_12","alias_value":"DMT6MKATDZLH","created_at":"2026-05-18T12:31:12Z"},{"alias_kind":"pith_short_16","alias_value":"DMT6MKATDZLHMXOS","created_at":"2026-05-18T12:31:12Z"},{"alias_kind":"pith_short_8","alias_value":"DMT6MKAT","created_at":"2026-05-18T12:31:12Z"}],"graph_snapshots":[{"event_id":"sha256:1af0a70a2221ea883c2c895076daf197debdfbfb1153ac57689fda586b819f1c","target":"graph","created_at":"2026-05-18T00:48:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Sparsity is one of the major problems in natural language processing. The problem becomes even more severe in agglutinating languages that are highly prone to be inflected. We deal with sparsity in Turkish by adopting morphological features for part-of-speech tagging. We learn inflectional and derivational morpheme tags in Turkish by using conditional random fields (CRF) and we employ the morpheme tags in part-of-speech (PoS) tagging by using hidden Markov models (HMMs) to mitigate sparsity. Results show that using morpheme tags in PoS tagging helps alleviate the sparsity in emission probabili","authors_text":"Ahmet \\\"Ust\\\"un, Burcu Can, Murathan Kurfal{\\i}","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-03-09T09:46:56Z","title":"Turkish PoS Tagging by Reducing Sparsity with Morpheme Tags in Small Datasets"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1703.03200","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:f51f2481353f603903fd05b4c14afdc55f04a9c9b186b3bb319a8c055071909e","target":"record","created_at":"2026-05-18T00:48:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e728cbcb6b07c27b48723db598e1a190be674b3ce401ac8f1915eedd4d92c35f","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-03-09T09:46:56Z","title_canon_sha256":"3e8eb13e1a9181a41e5fd7cec849da5081a34d3af3a0a5a7b35fcc88ea2451b9"},"schema_version":"1.0","source":{"id":"1703.03200","kind":"arxiv","version":2}},"canonical_sha256":"1b27e628131e56765dd2670d469c413305ef15a9ffde0e7d4ba78f6e2a44c070","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"1b27e628131e56765dd2670d469c413305ef15a9ffde0e7d4ba78f6e2a44c070","first_computed_at":"2026-05-18T00:48:59.153184Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:48:59.153184Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"mSdXMOKR+IOrFtH6z2nvCMQc7jj/S/PTD2GYBh7x8M0tYoj7t/bpvTA1ErMXclVuM4VDz1gUW6L3jR9zeHueDg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:48:59.153746Z","signed_message":"canonical_sha256_bytes"},"source_id":"1703.03200","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:f51f2481353f603903fd05b4c14afdc55f04a9c9b186b3bb319a8c055071909e","sha256:1af0a70a2221ea883c2c895076daf197debdfbfb1153ac57689fda586b819f1c"],"state_sha256":"417bd54b9e0dceffc4fdc13ba201414c9c64cf337b5398725696d2e66c3070fd"}