{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2014:SH6EA2WZRSD27ZOLLA574TBVYJ","short_pith_number":"pith:SH6EA2WZ","canonical_record":{"source":{"id":"1407.4908","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","primary_cat":"cs.DC","submitted_at":"2014-07-18T08:17:55Z","cross_cats_sorted":[],"title_canon_sha256":"f2bdce76e4bf7b9d79de8d9ad47e249aa1f0650ecdc0545c6b2192c577c642c0","abstract_canon_sha256":"9ad99b0e6cf13b6c1879b7ea1b82765a0bfb9f563d25c429a899c1bc6d05a7d7"},"schema_version":"1.0"},"canonical_sha256":"91fc406ad98c87afe5cb583bfe4c35c257ce5f1c120b3d25d2f1aa54ddf5ed37","source":{"kind":"arxiv","id":"1407.4908","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1407.4908","created_at":"2026-05-18T00:24:04Z"},{"alias_kind":"arxiv_version","alias_value":"1407.4908v1","created_at":"2026-05-18T00:24:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1407.4908","created_at":"2026-05-18T00:24:04Z"},{"alias_kind":"pith_short_12","alias_value":"SH6EA2WZRSD2","created_at":"2026-05-18T12:28:49Z"},{"alias_kind":"pith_short_16","alias_value":"SH6EA2WZRSD27ZOL","created_at":"2026-05-18T12:28:49Z"},{"alias_kind":"pith_short_8","alias_value":"SH6EA2WZ","created_at":"2026-05-18T12:28:49Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2014:SH6EA2WZRSD27ZOLLA574TBVYJ","target":"record","payload":{"canonical_record":{"source":{"id":"1407.4908","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","primary_cat":"cs.DC","submitted_at":"2014-07-18T08:17:55Z","cross_cats_sorted":[],"title_canon_sha256":"f2bdce76e4bf7b9d79de8d9ad47e249aa1f0650ecdc0545c6b2192c577c642c0","abstract_canon_sha256":"9ad99b0e6cf13b6c1879b7ea1b82765a0bfb9f563d25c429a899c1bc6d05a7d7"},"schema_version":"1.0"},"canonical_sha256":"91fc406ad98c87afe5cb583bfe4c35c257ce5f1c120b3d25d2f1aa54ddf5ed37","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:24:04.798215Z","signature_b64":"FNJqH9gQN92C5SP2GZlR29QAodfgmQkHJYSANYQogz/PfAd/nKh1cCf7MQw24EegwPLWqOiJQroNKKc3Y5TLDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"91fc406ad98c87afe5cb583bfe4c35c257ce5f1c120b3d25d2f1aa54ddf5ed37","last_reissued_at":"2026-05-18T00:24:04.797665Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:24:04.797665Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1407.4908","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:24:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cQYdqXLX7b7R6jeY2SUNaeYupSdNnZapXe9C3uDR0vQlYLP78jBT6LwzFMz26t4Ye9N+eDXhqD4adn4GWzUIBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-27T10:06:10.127660Z"},"content_sha256":"fb8e67f75f2398323fc302c340474deb2706968cd669e0ccee8f76fad23394f3","schema_version":"1.0","event_id":"sha256:fb8e67f75f2398323fc302c340474deb2706968cd669e0ccee8f76fad23394f3"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2014:SH6EA2WZRSD27ZOLLA574TBVYJ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Integrating R and Hadoop for Big Data Analysis","license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","headline":"","cross_cats":[],"primary_cat":"cs.DC","authors_text":"Bogdan Oancea, Raluca Mariana Dragoescu","submitted_at":"2014-07-18T08:17:55Z","abstract_excerpt":"Analyzing and working with big data could be very diffi cult using classical means like relational database management systems or desktop software packages for statistics and visualization. Instead, big data requires large clusters with hundreds or even thousands of computing nodes. Offi cial statistics is increasingly considering big data for deriving new statistics because big data sources could produce more relevant and timely statistics than traditional sources. One of the software tools successfully and wide spread used for storage and processing of big data sets on clusters of commodity "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1407.4908","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:24:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Is0Skj19fvaFsP6cOKv9PSMIodkKrC2DTXPyu2G39kLru+7OVzc89bsjoZapUfvV/jiiee8ywm2eRlgQRStRCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-27T10:06:10.128007Z"},"content_sha256":"7d1bed5e434b12d2927af1a964d3a4be5aedee1a5a436262264189e5baaab88f","schema_version":"1.0","event_id":"sha256:7d1bed5e434b12d2927af1a964d3a4be5aedee1a5a436262264189e5baaab88f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/SH6EA2WZRSD27ZOLLA574TBVYJ/bundle.json","state_url":"https://pith.science/pith/SH6EA2WZRSD27ZOLLA574TBVYJ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/SH6EA2WZRSD27ZOLLA574TBVYJ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-27T10:06:10Z","links":{"resolver":"https://pith.science/pith/SH6EA2WZRSD27ZOLLA574TBVYJ","bundle":"https://pith.science/pith/SH6EA2WZRSD27ZOLLA574TBVYJ/bundle.json","state":"https://pith.science/pith/SH6EA2WZRSD27ZOLLA574TBVYJ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/SH6EA2WZRSD27ZOLLA574TBVYJ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2014:SH6EA2WZRSD27ZOLLA574TBVYJ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"9ad99b0e6cf13b6c1879b7ea1b82765a0bfb9f563d25c429a899c1bc6d05a7d7","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","primary_cat":"cs.DC","submitted_at":"2014-07-18T08:17:55Z","title_canon_sha256":"f2bdce76e4bf7b9d79de8d9ad47e249aa1f0650ecdc0545c6b2192c577c642c0"},"schema_version":"1.0","source":{"id":"1407.4908","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1407.4908","created_at":"2026-05-18T00:24:04Z"},{"alias_kind":"arxiv_version","alias_value":"1407.4908v1","created_at":"2026-05-18T00:24:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1407.4908","created_at":"2026-05-18T00:24:04Z"},{"alias_kind":"pith_short_12","alias_value":"SH6EA2WZRSD2","created_at":"2026-05-18T12:28:49Z"},{"alias_kind":"pith_short_16","alias_value":"SH6EA2WZRSD27ZOL","created_at":"2026-05-18T12:28:49Z"},{"alias_kind":"pith_short_8","alias_value":"SH6EA2WZ","created_at":"2026-05-18T12:28:49Z"}],"graph_snapshots":[{"event_id":"sha256:7d1bed5e434b12d2927af1a964d3a4be5aedee1a5a436262264189e5baaab88f","target":"graph","created_at":"2026-05-18T00:24:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Analyzing and working with big data could be very diffi cult using classical means like relational database management systems or desktop software packages for statistics and visualization. Instead, big data requires large clusters with hundreds or even thousands of computing nodes. Offi cial statistics is increasingly considering big data for deriving new statistics because big data sources could produce more relevant and timely statistics than traditional sources. One of the software tools successfully and wide spread used for storage and processing of big data sets on clusters of commodity ","authors_text":"Bogdan Oancea, Raluca Mariana Dragoescu","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","primary_cat":"cs.DC","submitted_at":"2014-07-18T08:17:55Z","title":"Integrating R and Hadoop for Big Data Analysis"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1407.4908","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:fb8e67f75f2398323fc302c340474deb2706968cd669e0ccee8f76fad23394f3","target":"record","created_at":"2026-05-18T00:24:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"9ad99b0e6cf13b6c1879b7ea1b82765a0bfb9f563d25c429a899c1bc6d05a7d7","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","primary_cat":"cs.DC","submitted_at":"2014-07-18T08:17:55Z","title_canon_sha256":"f2bdce76e4bf7b9d79de8d9ad47e249aa1f0650ecdc0545c6b2192c577c642c0"},"schema_version":"1.0","source":{"id":"1407.4908","kind":"arxiv","version":1}},"canonical_sha256":"91fc406ad98c87afe5cb583bfe4c35c257ce5f1c120b3d25d2f1aa54ddf5ed37","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"91fc406ad98c87afe5cb583bfe4c35c257ce5f1c120b3d25d2f1aa54ddf5ed37","first_computed_at":"2026-05-18T00:24:04.797665Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:24:04.797665Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"FNJqH9gQN92C5SP2GZlR29QAodfgmQkHJYSANYQogz/PfAd/nKh1cCf7MQw24EegwPLWqOiJQroNKKc3Y5TLDA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:24:04.798215Z","signed_message":"canonical_sha256_bytes"},"source_id":"1407.4908","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:fb8e67f75f2398323fc302c340474deb2706968cd669e0ccee8f76fad23394f3","sha256:7d1bed5e434b12d2927af1a964d3a4be5aedee1a5a436262264189e5baaab88f"],"state_sha256":"c59380be8c32754ca80e4b4b267bbb4a558b90d33b8b5fe17daf7347f640f4d1"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"flLBCVzmG9D87WTEhh9XefEMB+W94rdkvr7oN+gfWxDo+PdvAhI1V153I1n/OswujsA+2gA7VAP+inTOeOdoBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-27T10:06:10.129939Z","bundle_sha256":"d36422ebafbe054b55f13c9c5add618cb8270ba606f5d8a7a24684809988fa84"}}