{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2014:7UYPZP6HTLDGJ4ZKOJU3C7HN7H","short_pith_number":"pith:7UYPZP6H","canonical_record":{"source":{"id":"1410.4792","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ME","submitted_at":"2014-10-17T16:46:45Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"3b8c97fce321bbfb3a819168af3f22fa798ed191fcb9f498dbc149a235f2e8d4","abstract_canon_sha256":"5ed63dedbbed5fca586abe89b33e6d22e97d4e59e22eb32d28279914f18be09f"},"schema_version":"1.0"},"canonical_sha256":"fd30fcbfc79ac664f32a7269b17cedf9fb2b0eaae56cc0c7ad9447f35da16fd4","source":{"kind":"arxiv","id":"1410.4792","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1410.4792","created_at":"2026-05-18T02:39:54Z"},{"alias_kind":"arxiv_version","alias_value":"1410.4792v1","created_at":"2026-05-18T02:39:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1410.4792","created_at":"2026-05-18T02:39:54Z"},{"alias_kind":"pith_short_12","alias_value":"7UYPZP6HTLDG","created_at":"2026-05-18T12:28:19Z"},{"alias_kind":"pith_short_16","alias_value":"7UYPZP6HTLDGJ4ZK","created_at":"2026-05-18T12:28:19Z"},{"alias_kind":"pith_short_8","alias_value":"7UYPZP6H","created_at":"2026-05-18T12:28:19Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2014:7UYPZP6HTLDGJ4ZKOJU3C7HN7H","target":"record","payload":{"canonical_record":{"source":{"id":"1410.4792","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ME","submitted_at":"2014-10-17T16:46:45Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"3b8c97fce321bbfb3a819168af3f22fa798ed191fcb9f498dbc149a235f2e8d4","abstract_canon_sha256":"5ed63dedbbed5fca586abe89b33e6d22e97d4e59e22eb32d28279914f18be09f"},"schema_version":"1.0"},"canonical_sha256":"fd30fcbfc79ac664f32a7269b17cedf9fb2b0eaae56cc0c7ad9447f35da16fd4","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:39:54.722823Z","signature_b64":"sp54LFtbYbOrfVC0TmiQdjZ85l+FCB3Sq7ty6rW+3ddCVf6lUuQ+JgNRlZ6ttqcTTeOwoDKA+Pd9AJ0Ir1jXDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"fd30fcbfc79ac664f32a7269b17cedf9fb2b0eaae56cc0c7ad9447f35da16fd4","last_reissued_at":"2026-05-18T02:39:54.722221Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:39:54.722221Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1410.4792","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:39:54Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"PZBZ7Mgojmnc/LnkGzgcFnYjxtv8FO8h0dFtALNeIMfTs66CuliYVpvlCQfK0zEt2wZ4jGJdYUO0k/78lmNRAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-21T12:35:57.225053Z"},"content_sha256":"02eac5ba34075681218da985293956a9772bdce1f0c5138c8bb3659ca2630af8","schema_version":"1.0","event_id":"sha256:02eac5ba34075681218da985293956a9772bdce1f0c5138c8bb3659ca2630af8"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2014:7UYPZP6HTLDGJ4ZKOJU3C7HN7H","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Variational Bayes for Merging Noisy Databases","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"stat.ME","authors_text":"Rebecca C. Steorts, Tamara Broderick","submitted_at":"2014-10-17T16:46:45Z","abstract_excerpt":"Bayesian entity resolution merges together multiple, noisy databases and returns the minimal collection of unique individuals represented, together with their true, latent record values. Bayesian methods allow flexible generative models that share power across databases as well as principled quantification of uncertainty for queries of the final, resolved database. However, existing Bayesian methods for entity resolution use Markov monte Carlo method (MCMC) approximations and are too slow to run on modern databases containing millions or billions of records. Instead, we propose applying variat"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1410.4792","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:39:54Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"0X2TFnoegH9rOLRvR8lmu/OJe0/KSV+vgu/XmWb/KBCh/vYJqHGJ77v07crB8HTb75YWAo0V6eg+RRyifrOnDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-21T12:35:57.225417Z"},"content_sha256":"4f78f7edb4d4a120172cc3054b9b4a749e053bdc1efeb2a214bd3a1516f97727","schema_version":"1.0","event_id":"sha256:4f78f7edb4d4a120172cc3054b9b4a749e053bdc1efeb2a214bd3a1516f97727"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/7UYPZP6HTLDGJ4ZKOJU3C7HN7H/bundle.json","state_url":"https://pith.science/pith/7UYPZP6HTLDGJ4ZKOJU3C7HN7H/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/7UYPZP6HTLDGJ4ZKOJU3C7HN7H/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-21T12:35:57Z","links":{"resolver":"https://pith.science/pith/7UYPZP6HTLDGJ4ZKOJU3C7HN7H","bundle":"https://pith.science/pith/7UYPZP6HTLDGJ4ZKOJU3C7HN7H/bundle.json","state":"https://pith.science/pith/7UYPZP6HTLDGJ4ZKOJU3C7HN7H/state.json","well_known_bundle":"https://pith.science/.well-known/pith/7UYPZP6HTLDGJ4ZKOJU3C7HN7H/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2014:7UYPZP6HTLDGJ4ZKOJU3C7HN7H","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5ed63dedbbed5fca586abe89b33e6d22e97d4e59e22eb32d28279914f18be09f","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ME","submitted_at":"2014-10-17T16:46:45Z","title_canon_sha256":"3b8c97fce321bbfb3a819168af3f22fa798ed191fcb9f498dbc149a235f2e8d4"},"schema_version":"1.0","source":{"id":"1410.4792","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1410.4792","created_at":"2026-05-18T02:39:54Z"},{"alias_kind":"arxiv_version","alias_value":"1410.4792v1","created_at":"2026-05-18T02:39:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1410.4792","created_at":"2026-05-18T02:39:54Z"},{"alias_kind":"pith_short_12","alias_value":"7UYPZP6HTLDG","created_at":"2026-05-18T12:28:19Z"},{"alias_kind":"pith_short_16","alias_value":"7UYPZP6HTLDGJ4ZK","created_at":"2026-05-18T12:28:19Z"},{"alias_kind":"pith_short_8","alias_value":"7UYPZP6H","created_at":"2026-05-18T12:28:19Z"}],"graph_snapshots":[{"event_id":"sha256:4f78f7edb4d4a120172cc3054b9b4a749e053bdc1efeb2a214bd3a1516f97727","target":"graph","created_at":"2026-05-18T02:39:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Bayesian entity resolution merges together multiple, noisy databases and returns the minimal collection of unique individuals represented, together with their true, latent record values. Bayesian methods allow flexible generative models that share power across databases as well as principled quantification of uncertainty for queries of the final, resolved database. However, existing Bayesian methods for entity resolution use Markov monte Carlo method (MCMC) approximations and are too slow to run on modern databases containing millions or billions of records. Instead, we propose applying variat","authors_text":"Rebecca C. Steorts, Tamara Broderick","cross_cats":["stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ME","submitted_at":"2014-10-17T16:46:45Z","title":"Variational Bayes for Merging Noisy Databases"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1410.4792","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:02eac5ba34075681218da985293956a9772bdce1f0c5138c8bb3659ca2630af8","target":"record","created_at":"2026-05-18T02:39:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5ed63dedbbed5fca586abe89b33e6d22e97d4e59e22eb32d28279914f18be09f","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ME","submitted_at":"2014-10-17T16:46:45Z","title_canon_sha256":"3b8c97fce321bbfb3a819168af3f22fa798ed191fcb9f498dbc149a235f2e8d4"},"schema_version":"1.0","source":{"id":"1410.4792","kind":"arxiv","version":1}},"canonical_sha256":"fd30fcbfc79ac664f32a7269b17cedf9fb2b0eaae56cc0c7ad9447f35da16fd4","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"fd30fcbfc79ac664f32a7269b17cedf9fb2b0eaae56cc0c7ad9447f35da16fd4","first_computed_at":"2026-05-18T02:39:54.722221Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:39:54.722221Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"sp54LFtbYbOrfVC0TmiQdjZ85l+FCB3Sq7ty6rW+3ddCVf6lUuQ+JgNRlZ6ttqcTTeOwoDKA+Pd9AJ0Ir1jXDQ==","signature_status":"signed_v1","signed_at":"2026-05-18T02:39:54.722823Z","signed_message":"canonical_sha256_bytes"},"source_id":"1410.4792","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:02eac5ba34075681218da985293956a9772bdce1f0c5138c8bb3659ca2630af8","sha256:4f78f7edb4d4a120172cc3054b9b4a749e053bdc1efeb2a214bd3a1516f97727"],"state_sha256":"86beb816bb606207d6fd5ff01e7b4bbe05a1c9762c6426f28c18c1676471362c"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"fuo+6092QqWuLW2YaNApSk4Xp1h2hUB9QtUgYq7mgrco7ZOIRAB4zBXCDgKXws7GbPFHVexMcN2kQwZltZ6wBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-21T12:35:57.227434Z","bundle_sha256":"4c1ed78001b696d69edba984acf24eff400e815fc46f61838b074d04b1fdec1a"}}