{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:ZQAOUOANUWZQEPBPNXNSB7XUIJ","short_pith_number":"pith:ZQAOUOAN","canonical_record":{"source":{"id":"1701.08702","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-01-27T18:43:31Z","cross_cats_sorted":[],"title_canon_sha256":"8539fc175b90a1b8a9204af66168c78054efb07dfc60c188d1c8709b159bcbe9","abstract_canon_sha256":"038d541c44cea8902919dc7e7e2438713b266b84190558c5adcdd64deaec0f5a"},"schema_version":"1.0"},"canonical_sha256":"cc00ea380da5b3023c2f6ddb20fef44241dfeeca2498c6d012f53b20e47fa38b","source":{"kind":"arxiv","id":"1701.08702","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1701.08702","created_at":"2026-05-18T00:51:52Z"},{"alias_kind":"arxiv_version","alias_value":"1701.08702v1","created_at":"2026-05-18T00:51:52Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1701.08702","created_at":"2026-05-18T00:51:52Z"},{"alias_kind":"pith_short_12","alias_value":"ZQAOUOANUWZQ","created_at":"2026-05-18T12:31:59Z"},{"alias_kind":"pith_short_16","alias_value":"ZQAOUOANUWZQEPBP","created_at":"2026-05-18T12:31:59Z"},{"alias_kind":"pith_short_8","alias_value":"ZQAOUOAN","created_at":"2026-05-18T12:31:59Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:ZQAOUOANUWZQEPBPNXNSB7XUIJ","target":"record","payload":{"canonical_record":{"source":{"id":"1701.08702","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-01-27T18:43:31Z","cross_cats_sorted":[],"title_canon_sha256":"8539fc175b90a1b8a9204af66168c78054efb07dfc60c188d1c8709b159bcbe9","abstract_canon_sha256":"038d541c44cea8902919dc7e7e2438713b266b84190558c5adcdd64deaec0f5a"},"schema_version":"1.0"},"canonical_sha256":"cc00ea380da5b3023c2f6ddb20fef44241dfeeca2498c6d012f53b20e47fa38b","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:51:52.924763Z","signature_b64":"P9u+uKVav22ocS8D5w82AnAloDKhGg9JQNE/Y0BfdcJ9YXfLhI6Gwh28nWr7cdTs6mF9QZbmNaiQW+1DJlx0Dg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"cc00ea380da5b3023c2f6ddb20fef44241dfeeca2498c6d012f53b20e47fa38b","last_reissued_at":"2026-05-18T00:51:52.924116Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:51:52.924116Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1701.08702","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:51:52Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"oa8eZdS6L/Qgo3/1pCVr3TZo6Pwj6tGHZQvSrIjcfB6ubhX7wtSiHlV9YnvWmVisy5NDGA+/FE1OWdaFd+/KDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-25T18:58:04.582904Z"},"content_sha256":"a68ef074ae77ebd07c1dc892a759076bf688594c400ed57e516dd3df199da2b7","schema_version":"1.0","event_id":"sha256:a68ef074ae77ebd07c1dc892a759076bf688594c400ed57e516dd3df199da2b7"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:ZQAOUOANUWZQEPBPNXNSB7XUIJ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Bangla Word Clustering Based on Tri-gram, 4-gram and 5-gram Language Model","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Dipaloke Saha, Md Saddam Hossain, Md. Saiful Islam, Sabir Ismail","submitted_at":"2017-01-27T18:43:31Z","abstract_excerpt":"In this paper, we describe a research method that generates Bangla word clusters on the basis of relating to meaning in language and contextual similarity. The importance of word clustering is in parts of speech (POS) tagging, word sense disambiguation, text classification, recommender system, spell checker, grammar checker, knowledge discover and for many others Natural Language Processing (NLP) applications. In the history of word clustering, English and some other languages have already implemented some methods on word clustering efficiently. But due to lack of the resources, word clusterin"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1701.08702","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:51:52Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"iYUPtRljhIoSdh/oZayJr1j3tpCFduil7lkz+HEVx6UC4v8nDdKLELxsS4B3LOR88x0YvlgOXAtrAS97PDWOAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-25T18:58:04.583235Z"},"content_sha256":"726fc2d390a18eefabe3181a61fd34acaae630ef349e4fa0621cfe37e1705801","schema_version":"1.0","event_id":"sha256:726fc2d390a18eefabe3181a61fd34acaae630ef349e4fa0621cfe37e1705801"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ZQAOUOANUWZQEPBPNXNSB7XUIJ/bundle.json","state_url":"https://pith.science/pith/ZQAOUOANUWZQEPBPNXNSB7XUIJ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ZQAOUOANUWZQEPBPNXNSB7XUIJ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-25T18:58:04Z","links":{"resolver":"https://pith.science/pith/ZQAOUOANUWZQEPBPNXNSB7XUIJ","bundle":"https://pith.science/pith/ZQAOUOANUWZQEPBPNXNSB7XUIJ/bundle.json","state":"https://pith.science/pith/ZQAOUOANUWZQEPBPNXNSB7XUIJ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ZQAOUOANUWZQEPBPNXNSB7XUIJ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:ZQAOUOANUWZQEPBPNXNSB7XUIJ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"038d541c44cea8902919dc7e7e2438713b266b84190558c5adcdd64deaec0f5a","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-01-27T18:43:31Z","title_canon_sha256":"8539fc175b90a1b8a9204af66168c78054efb07dfc60c188d1c8709b159bcbe9"},"schema_version":"1.0","source":{"id":"1701.08702","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1701.08702","created_at":"2026-05-18T00:51:52Z"},{"alias_kind":"arxiv_version","alias_value":"1701.08702v1","created_at":"2026-05-18T00:51:52Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1701.08702","created_at":"2026-05-18T00:51:52Z"},{"alias_kind":"pith_short_12","alias_value":"ZQAOUOANUWZQ","created_at":"2026-05-18T12:31:59Z"},{"alias_kind":"pith_short_16","alias_value":"ZQAOUOANUWZQEPBP","created_at":"2026-05-18T12:31:59Z"},{"alias_kind":"pith_short_8","alias_value":"ZQAOUOAN","created_at":"2026-05-18T12:31:59Z"}],"graph_snapshots":[{"event_id":"sha256:726fc2d390a18eefabe3181a61fd34acaae630ef349e4fa0621cfe37e1705801","target":"graph","created_at":"2026-05-18T00:51:52Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In this paper, we describe a research method that generates Bangla word clusters on the basis of relating to meaning in language and contextual similarity. The importance of word clustering is in parts of speech (POS) tagging, word sense disambiguation, text classification, recommender system, spell checker, grammar checker, knowledge discover and for many others Natural Language Processing (NLP) applications. In the history of word clustering, English and some other languages have already implemented some methods on word clustering efficiently. But due to lack of the resources, word clusterin","authors_text":"Dipaloke Saha, Md Saddam Hossain, Md. Saiful Islam, Sabir Ismail","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-01-27T18:43:31Z","title":"Bangla Word Clustering Based on Tri-gram, 4-gram and 5-gram Language Model"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1701.08702","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a68ef074ae77ebd07c1dc892a759076bf688594c400ed57e516dd3df199da2b7","target":"record","created_at":"2026-05-18T00:51:52Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"038d541c44cea8902919dc7e7e2438713b266b84190558c5adcdd64deaec0f5a","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-01-27T18:43:31Z","title_canon_sha256":"8539fc175b90a1b8a9204af66168c78054efb07dfc60c188d1c8709b159bcbe9"},"schema_version":"1.0","source":{"id":"1701.08702","kind":"arxiv","version":1}},"canonical_sha256":"cc00ea380da5b3023c2f6ddb20fef44241dfeeca2498c6d012f53b20e47fa38b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"cc00ea380da5b3023c2f6ddb20fef44241dfeeca2498c6d012f53b20e47fa38b","first_computed_at":"2026-05-18T00:51:52.924116Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:51:52.924116Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"P9u+uKVav22ocS8D5w82AnAloDKhGg9JQNE/Y0BfdcJ9YXfLhI6Gwh28nWr7cdTs6mF9QZbmNaiQW+1DJlx0Dg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:51:52.924763Z","signed_message":"canonical_sha256_bytes"},"source_id":"1701.08702","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a68ef074ae77ebd07c1dc892a759076bf688594c400ed57e516dd3df199da2b7","sha256:726fc2d390a18eefabe3181a61fd34acaae630ef349e4fa0621cfe37e1705801"],"state_sha256":"6d0a90f56642dd31f1a825fc47b93fb036758f369760a4c41643f12d51bcc380"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"QMjpP1SNmqKiucDQTDmljgQRVM28vCpT+rthEOIHUNwuxUKs1nlKyelmRibwiWY2I+iNjCLlAGZc9nWJoxHoDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-25T18:58:04.585118Z","bundle_sha256":"0c0e8fadf0710a6e96cfd41e02e089b8154e4cb4de2718c15fc3ac7a3661e197"}}