{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2017:GGTX562DP5ZUM7XIELHM5NLBJC","short_pith_number":"pith:GGTX562D","schema_version":"1.0","canonical_sha256":"31a77efb437f73467ee822ceceb5614898dd251da7bced039b76b5f458df5424","source":{"kind":"arxiv","id":"1705.04789","version":1},"attestation_state":"computed","paper":{"title":"Scalable and Efficient Construction of Suffix Array with MapReduce and In-Memory Data Store System","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.DC","authors_text":"Chien-Min Wang, Hsiang-Huang Wu, Hsuan-Chi Kuo, Jan-Ming Ho, Wei-Chun Chung","submitted_at":"2017-05-13T04:47:44Z","abstract_excerpt":"Suffix Array (SA) is a cardinal data structure in many pattern matching applications, including data compression, plagiarism detection and sequence alignment. However, as the volumes of data increase abruptly, the construction of SA is not amenable to the current large-scale data processing frameworks anymore due to its intrinsic proliferation of suffixes during the construction. That is, ameliorating the performance by just adding the resources to the frameworks becomes less cost- effective, even having the severe diminishing returns. At issue now is whether we can permit SA construction to b"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1705.04789","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2017-05-13T04:47:44Z","cross_cats_sorted":[],"title_canon_sha256":"1b2b7d9782f7c6264c24f5f72980ff0aec419c2ec6d8617e307c27784bfa5477","abstract_canon_sha256":"2b43b67e812816351c57c2a7c2b7acf3c7af016630edb60a523af8d83e94242f"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:44:34.629119Z","signature_b64":"mRBD2bGTijejFN2L7Hk31uTPX0Re327iLLaUaN2P5SPdXtW70N83NZ4gDv1cuPgYWeGoMwcGdMHpwVs1zVgdAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"31a77efb437f73467ee822ceceb5614898dd251da7bced039b76b5f458df5424","last_reissued_at":"2026-05-18T00:44:34.628606Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:44:34.628606Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Scalable and Efficient Construction of Suffix Array with MapReduce and In-Memory Data Store System","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.DC","authors_text":"Chien-Min Wang, Hsiang-Huang Wu, Hsuan-Chi Kuo, Jan-Ming Ho, Wei-Chun Chung","submitted_at":"2017-05-13T04:47:44Z","abstract_excerpt":"Suffix Array (SA) is a cardinal data structure in many pattern matching applications, including data compression, plagiarism detection and sequence alignment. However, as the volumes of data increase abruptly, the construction of SA is not amenable to the current large-scale data processing frameworks anymore due to its intrinsic proliferation of suffixes during the construction. That is, ameliorating the performance by just adding the resources to the frameworks becomes less cost- effective, even having the severe diminishing returns. At issue now is whether we can permit SA construction to b"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1705.04789","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1705.04789","created_at":"2026-05-18T00:44:34.628704+00:00"},{"alias_kind":"arxiv_version","alias_value":"1705.04789v1","created_at":"2026-05-18T00:44:34.628704+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1705.04789","created_at":"2026-05-18T00:44:34.628704+00:00"},{"alias_kind":"pith_short_12","alias_value":"GGTX562DP5ZU","created_at":"2026-05-18T12:31:15.632608+00:00"},{"alias_kind":"pith_short_16","alias_value":"GGTX562DP5ZUM7XI","created_at":"2026-05-18T12:31:15.632608+00:00"},{"alias_kind":"pith_short_8","alias_value":"GGTX562D","created_at":"2026-05-18T12:31:15.632608+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/GGTX562DP5ZUM7XIELHM5NLBJC","json":"https://pith.science/pith/GGTX562DP5ZUM7XIELHM5NLBJC.json","graph_json":"https://pith.science/api/pith-number/GGTX562DP5ZUM7XIELHM5NLBJC/graph.json","events_json":"https://pith.science/api/pith-number/GGTX562DP5ZUM7XIELHM5NLBJC/events.json","paper":"https://pith.science/paper/GGTX562D"},"agent_actions":{"view_html":"https://pith.science/pith/GGTX562DP5ZUM7XIELHM5NLBJC","download_json":"https://pith.science/pith/GGTX562DP5ZUM7XIELHM5NLBJC.json","view_paper":"https://pith.science/paper/GGTX562D","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1705.04789&json=true","fetch_graph":"https://pith.science/api/pith-number/GGTX562DP5ZUM7XIELHM5NLBJC/graph.json","fetch_events":"https://pith.science/api/pith-number/GGTX562DP5ZUM7XIELHM5NLBJC/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/GGTX562DP5ZUM7XIELHM5NLBJC/action/timestamp_anchor","attest_storage":"https://pith.science/pith/GGTX562DP5ZUM7XIELHM5NLBJC/action/storage_attestation","attest_author":"https://pith.science/pith/GGTX562DP5ZUM7XIELHM5NLBJC/action/author_attestation","sign_citation":"https://pith.science/pith/GGTX562DP5ZUM7XIELHM5NLBJC/action/citation_signature","submit_replication":"https://pith.science/pith/GGTX562DP5ZUM7XIELHM5NLBJC/action/replication_record"}},"created_at":"2026-05-18T00:44:34.628704+00:00","updated_at":"2026-05-18T00:44:34.628704+00:00"}