{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:X22ST5UIHTPMSUGRVMG4HU4SM6","short_pith_number":"pith:X22ST5UI","canonical_record":{"source":{"id":"2605.19922","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-05-19T14:45:59Z","cross_cats_sorted":["cs.DB"],"title_canon_sha256":"4997eddd9767459d4753da04957b5d8e6b9db49151aa8f014fd171d862e34291","abstract_canon_sha256":"4e4ca3aa4151b52c1cdb18ea9c4455de33b47654dfbfcf116fc49f0689003c3c"},"schema_version":"1.0"},"canonical_sha256":"beb529f6883cdec950d1ab0dc3d3926787794c233e1bc457a4e00ceee262fb18","source":{"kind":"arxiv","id":"2605.19922","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.19922","created_at":"2026-05-20T02:05:55Z"},{"alias_kind":"arxiv_version","alias_value":"2605.19922v1","created_at":"2026-05-20T02:05:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.19922","created_at":"2026-05-20T02:05:55Z"},{"alias_kind":"pith_short_12","alias_value":"X22ST5UIHTPM","created_at":"2026-05-20T02:05:55Z"},{"alias_kind":"pith_short_16","alias_value":"X22ST5UIHTPMSUGR","created_at":"2026-05-20T02:05:55Z"},{"alias_kind":"pith_short_8","alias_value":"X22ST5UI","created_at":"2026-05-20T02:05:55Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:X22ST5UIHTPMSUGRVMG4HU4SM6","target":"record","payload":{"canonical_record":{"source":{"id":"2605.19922","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-05-19T14:45:59Z","cross_cats_sorted":["cs.DB"],"title_canon_sha256":"4997eddd9767459d4753da04957b5d8e6b9db49151aa8f014fd171d862e34291","abstract_canon_sha256":"4e4ca3aa4151b52c1cdb18ea9c4455de33b47654dfbfcf116fc49f0689003c3c"},"schema_version":"1.0"},"canonical_sha256":"beb529f6883cdec950d1ab0dc3d3926787794c233e1bc457a4e00ceee262fb18","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T02:05:55.431560Z","signature_b64":"DYLRpp9j0ABJVDmbG2dbkGjakatoT34AIVP2cOtPchmKeZ+nOuPQYPx8y9F35zUF/tnnJ2btuR2b3Hh+EAkrAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"beb529f6883cdec950d1ab0dc3d3926787794c233e1bc457a4e00ceee262fb18","last_reissued_at":"2026-05-20T02:05:55.430615Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T02:05:55.430615Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.19922","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T02:05:55Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"oyuy6Urw7/9hmedckfNOqD042U7D23oU8/070U9R1zqYCBTcfrSRmGkRbfEOWCWUh6eTlMXgaLtymk+RcBlRBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T16:44:57.627101Z"},"content_sha256":"5147081ed8c7f24a649aa098b3f491cc39c9098d1b900a31d6a0b36fec0d64df","schema_version":"1.0","event_id":"sha256:5147081ed8c7f24a649aa098b3f491cc39c9098d1b900a31d6a0b36fec0d64df"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:X22ST5UIHTPMSUGRVMG4HU4SM6","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"OpenHealth Lake: Designing and testing a data lakehouse platform for health applications","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.DB"],"primary_cat":"cs.SE","authors_text":"Cheryl Baxter, Danilo Silva, Joicymara Xavier, Marcel Dunaiski, Monika Moir, Tulio de Oliveira","submitted_at":"2026-05-19T14:45:59Z","abstract_excerpt":"Data management can be a complex challenge in fields such as bioinformatics and health sciences, which continuously generate extensive heterogeneous datasets. In the context of collaborative global health initiatives, secure storage and sharing of data are crucial to support impactful research. However, the absence of a unified data management platform complicates efficient data exchange and governance within these initiatives. In this paper, we introduce the design process of OpenHealth Lake, a data management prototype platform based on a data lakehouse architecture, data federation, and the"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.19922","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.19922/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T02:05:55Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"asGzGW9zEIQ0LQ9UO2+9ndBmvfmpEfVvTNy1WrV/qZEPke1rTvt7c/SBjTePsYXrByU0Ytve+7IHg8s4B4mdBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T16:44:57.627498Z"},"content_sha256":"57945d3bfa3b5e964de6ace41eba76eaec6f5e2d6900b384031d253e19cb68a9","schema_version":"1.0","event_id":"sha256:57945d3bfa3b5e964de6ace41eba76eaec6f5e2d6900b384031d253e19cb68a9"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/X22ST5UIHTPMSUGRVMG4HU4SM6/bundle.json","state_url":"https://pith.science/pith/X22ST5UIHTPMSUGRVMG4HU4SM6/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/X22ST5UIHTPMSUGRVMG4HU4SM6/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-21T16:44:57Z","links":{"resolver":"https://pith.science/pith/X22ST5UIHTPMSUGRVMG4HU4SM6","bundle":"https://pith.science/pith/X22ST5UIHTPMSUGRVMG4HU4SM6/bundle.json","state":"https://pith.science/pith/X22ST5UIHTPMSUGRVMG4HU4SM6/state.json","well_known_bundle":"https://pith.science/.well-known/pith/X22ST5UIHTPMSUGRVMG4HU4SM6/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:X22ST5UIHTPMSUGRVMG4HU4SM6","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4e4ca3aa4151b52c1cdb18ea9c4455de33b47654dfbfcf116fc49f0689003c3c","cross_cats_sorted":["cs.DB"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-05-19T14:45:59Z","title_canon_sha256":"4997eddd9767459d4753da04957b5d8e6b9db49151aa8f014fd171d862e34291"},"schema_version":"1.0","source":{"id":"2605.19922","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.19922","created_at":"2026-05-20T02:05:55Z"},{"alias_kind":"arxiv_version","alias_value":"2605.19922v1","created_at":"2026-05-20T02:05:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.19922","created_at":"2026-05-20T02:05:55Z"},{"alias_kind":"pith_short_12","alias_value":"X22ST5UIHTPM","created_at":"2026-05-20T02:05:55Z"},{"alias_kind":"pith_short_16","alias_value":"X22ST5UIHTPMSUGR","created_at":"2026-05-20T02:05:55Z"},{"alias_kind":"pith_short_8","alias_value":"X22ST5UI","created_at":"2026-05-20T02:05:55Z"}],"graph_snapshots":[{"event_id":"sha256:57945d3bfa3b5e964de6ace41eba76eaec6f5e2d6900b384031d253e19cb68a9","target":"graph","created_at":"2026-05-20T02:05:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.19922/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Data management can be a complex challenge in fields such as bioinformatics and health sciences, which continuously generate extensive heterogeneous datasets. In the context of collaborative global health initiatives, secure storage and sharing of data are crucial to support impactful research. However, the absence of a unified data management platform complicates efficient data exchange and governance within these initiatives. In this paper, we introduce the design process of OpenHealth Lake, a data management prototype platform based on a data lakehouse architecture, data federation, and the","authors_text":"Cheryl Baxter, Danilo Silva, Joicymara Xavier, Marcel Dunaiski, Monika Moir, Tulio de Oliveira","cross_cats":["cs.DB"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-05-19T14:45:59Z","title":"OpenHealth Lake: Designing and testing a data lakehouse platform for health applications"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.19922","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5147081ed8c7f24a649aa098b3f491cc39c9098d1b900a31d6a0b36fec0d64df","target":"record","created_at":"2026-05-20T02:05:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4e4ca3aa4151b52c1cdb18ea9c4455de33b47654dfbfcf116fc49f0689003c3c","cross_cats_sorted":["cs.DB"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SE","submitted_at":"2026-05-19T14:45:59Z","title_canon_sha256":"4997eddd9767459d4753da04957b5d8e6b9db49151aa8f014fd171d862e34291"},"schema_version":"1.0","source":{"id":"2605.19922","kind":"arxiv","version":1}},"canonical_sha256":"beb529f6883cdec950d1ab0dc3d3926787794c233e1bc457a4e00ceee262fb18","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"beb529f6883cdec950d1ab0dc3d3926787794c233e1bc457a4e00ceee262fb18","first_computed_at":"2026-05-20T02:05:55.430615Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T02:05:55.430615Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"DYLRpp9j0ABJVDmbG2dbkGjakatoT34AIVP2cOtPchmKeZ+nOuPQYPx8y9F35zUF/tnnJ2btuR2b3Hh+EAkrAw==","signature_status":"signed_v1","signed_at":"2026-05-20T02:05:55.431560Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.19922","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5147081ed8c7f24a649aa098b3f491cc39c9098d1b900a31d6a0b36fec0d64df","sha256:57945d3bfa3b5e964de6ace41eba76eaec6f5e2d6900b384031d253e19cb68a9"],"state_sha256":"7260579da5b1e90fd9cbfc26599e82faf2b5e479a71302f1e24f8da24a529ea9"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1uhe3CQTrEY5sMeuJVpgfWxt5K6VFzTmdKqCJCTmvSxqcSS/jwd2NdEKUxXX+JzvKTQEfIIpTqzEAvzNcohtAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-21T16:44:57.629799Z","bundle_sha256":"fd8bccb714ecd0d08169c8baa6b700ff7069f2e6e53031db81afb412c6f0f0f7"}}