{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:WVXTDVCSIAUHGTYM4ZEBIV426E","short_pith_number":"pith:WVXTDVCS","canonical_record":{"source":{"id":"1505.02065","kind":"arxiv","version":6},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2015-05-08T15:32:43Z","cross_cats_sorted":[],"title_canon_sha256":"888a99130c753cb862401dc6bdac26907e62d514463bc0907d57cd586edd61cd","abstract_canon_sha256":"8892f9c945681c1ae88291b35062e8cf9a0865fbad6a44d7a842b494d6475cdf"},"schema_version":"1.0"},"canonical_sha256":"b56f31d4524028734f0ce64814579af11ef9260a425439978de52df8c141db34","source":{"kind":"arxiv","id":"1505.02065","version":6},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1505.02065","created_at":"2026-05-18T00:46:43Z"},{"alias_kind":"arxiv_version","alias_value":"1505.02065v6","created_at":"2026-05-18T00:46:43Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1505.02065","created_at":"2026-05-18T00:46:43Z"},{"alias_kind":"pith_short_12","alias_value":"WVXTDVCSIAUH","created_at":"2026-05-18T12:29:47Z"},{"alias_kind":"pith_short_16","alias_value":"WVXTDVCSIAUHGTYM","created_at":"2026-05-18T12:29:47Z"},{"alias_kind":"pith_short_8","alias_value":"WVXTDVCS","created_at":"2026-05-18T12:29:47Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:WVXTDVCSIAUHGTYM4ZEBIV426E","target":"record","payload":{"canonical_record":{"source":{"id":"1505.02065","kind":"arxiv","version":6},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2015-05-08T15:32:43Z","cross_cats_sorted":[],"title_canon_sha256":"888a99130c753cb862401dc6bdac26907e62d514463bc0907d57cd586edd61cd","abstract_canon_sha256":"8892f9c945681c1ae88291b35062e8cf9a0865fbad6a44d7a842b494d6475cdf"},"schema_version":"1.0"},"canonical_sha256":"b56f31d4524028734f0ce64814579af11ef9260a425439978de52df8c141db34","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:46:43.252217Z","signature_b64":"8qEm4bU7Klw3WO6nkRqMPX+jSh093P5uoZLPmllUUl6eXYV4Oig19TPqrRJGIEEmHlacDmQgO04tm58X/bopBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b56f31d4524028734f0ce64814579af11ef9260a425439978de52df8c141db34","last_reissued_at":"2026-05-18T00:46:43.251451Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:46:43.251451Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1505.02065","source_version":6,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:46:43Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"MVBKzcWXbLpZd8TKziX55IEhUPlVPPiH5rxoEq8qCElH4s6X2Cj9u5bl6/VhBzfDhWTBgRYQcrZyqQ6jOjHTBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T10:01:19.010568Z"},"content_sha256":"ebd10c197316c645b8011910061f6e26b8bb2aa4f65494f1ed5374ea4db37def","schema_version":"1.0","event_id":"sha256:ebd10c197316c645b8011910061f6e26b8bb2aa4f65494f1ed5374ea4db37def"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:WVXTDVCSIAUHGTYM4ZEBIV426E","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Dense Distributions from Sparse Samples: Improved Gibbs Sampling Parameter Estimators for LDA","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"stat.ML","authors_text":"Grigorios Tsoumakas, James R. Foulds, Timothy N. Rubin, Yannis Papanikolaou","submitted_at":"2015-05-08T15:32:43Z","abstract_excerpt":"We introduce a novel approach for estimating Latent Dirichlet Allocation (LDA) parameters from collapsed Gibbs samples (CGS), by leveraging the full conditional distributions over the latent variable assignments to efficiently average over multiple samples, for little more computational cost than drawing a single additional collapsed Gibbs sample. Our approach can be understood as adapting the soft clustering methodology of Collapsed Variational Bayes (CVB0) to CGS parameter estimation, in order to get the best of both techniques. Our estimators can straightforwardly be applied to the output o"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1505.02065","kind":"arxiv","version":6},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:46:43Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Ch5ytyRF07vPU3dhqAnGkWKe2LldNPaTuHRkhR2MIu9s7p5kNDYTxoNpebd5Vp00ru6YUXOTGRwJ9QZt5x9YDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T10:01:19.010907Z"},"content_sha256":"5f29e31122dab6c212210e0936af702e2bfd3a94eddb9baaba82cd867bca393f","schema_version":"1.0","event_id":"sha256:5f29e31122dab6c212210e0936af702e2bfd3a94eddb9baaba82cd867bca393f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/WVXTDVCSIAUHGTYM4ZEBIV426E/bundle.json","state_url":"https://pith.science/pith/WVXTDVCSIAUHGTYM4ZEBIV426E/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/WVXTDVCSIAUHGTYM4ZEBIV426E/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-28T10:01:19Z","links":{"resolver":"https://pith.science/pith/WVXTDVCSIAUHGTYM4ZEBIV426E","bundle":"https://pith.science/pith/WVXTDVCSIAUHGTYM4ZEBIV426E/bundle.json","state":"https://pith.science/pith/WVXTDVCSIAUHGTYM4ZEBIV426E/state.json","well_known_bundle":"https://pith.science/.well-known/pith/WVXTDVCSIAUHGTYM4ZEBIV426E/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:WVXTDVCSIAUHGTYM4ZEBIV426E","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"8892f9c945681c1ae88291b35062e8cf9a0865fbad6a44d7a842b494d6475cdf","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2015-05-08T15:32:43Z","title_canon_sha256":"888a99130c753cb862401dc6bdac26907e62d514463bc0907d57cd586edd61cd"},"schema_version":"1.0","source":{"id":"1505.02065","kind":"arxiv","version":6}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1505.02065","created_at":"2026-05-18T00:46:43Z"},{"alias_kind":"arxiv_version","alias_value":"1505.02065v6","created_at":"2026-05-18T00:46:43Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1505.02065","created_at":"2026-05-18T00:46:43Z"},{"alias_kind":"pith_short_12","alias_value":"WVXTDVCSIAUH","created_at":"2026-05-18T12:29:47Z"},{"alias_kind":"pith_short_16","alias_value":"WVXTDVCSIAUHGTYM","created_at":"2026-05-18T12:29:47Z"},{"alias_kind":"pith_short_8","alias_value":"WVXTDVCS","created_at":"2026-05-18T12:29:47Z"}],"graph_snapshots":[{"event_id":"sha256:5f29e31122dab6c212210e0936af702e2bfd3a94eddb9baaba82cd867bca393f","target":"graph","created_at":"2026-05-18T00:46:43Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We introduce a novel approach for estimating Latent Dirichlet Allocation (LDA) parameters from collapsed Gibbs samples (CGS), by leveraging the full conditional distributions over the latent variable assignments to efficiently average over multiple samples, for little more computational cost than drawing a single additional collapsed Gibbs sample. Our approach can be understood as adapting the soft clustering methodology of Collapsed Variational Bayes (CVB0) to CGS parameter estimation, in order to get the best of both techniques. Our estimators can straightforwardly be applied to the output o","authors_text":"Grigorios Tsoumakas, James R. Foulds, Timothy N. Rubin, Yannis Papanikolaou","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2015-05-08T15:32:43Z","title":"Dense Distributions from Sparse Samples: Improved Gibbs Sampling Parameter Estimators for LDA"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1505.02065","kind":"arxiv","version":6},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ebd10c197316c645b8011910061f6e26b8bb2aa4f65494f1ed5374ea4db37def","target":"record","created_at":"2026-05-18T00:46:43Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"8892f9c945681c1ae88291b35062e8cf9a0865fbad6a44d7a842b494d6475cdf","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2015-05-08T15:32:43Z","title_canon_sha256":"888a99130c753cb862401dc6bdac26907e62d514463bc0907d57cd586edd61cd"},"schema_version":"1.0","source":{"id":"1505.02065","kind":"arxiv","version":6}},"canonical_sha256":"b56f31d4524028734f0ce64814579af11ef9260a425439978de52df8c141db34","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b56f31d4524028734f0ce64814579af11ef9260a425439978de52df8c141db34","first_computed_at":"2026-05-18T00:46:43.251451Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:46:43.251451Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"8qEm4bU7Klw3WO6nkRqMPX+jSh093P5uoZLPmllUUl6eXYV4Oig19TPqrRJGIEEmHlacDmQgO04tm58X/bopBQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:46:43.252217Z","signed_message":"canonical_sha256_bytes"},"source_id":"1505.02065","source_kind":"arxiv","source_version":6}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ebd10c197316c645b8011910061f6e26b8bb2aa4f65494f1ed5374ea4db37def","sha256:5f29e31122dab6c212210e0936af702e2bfd3a94eddb9baaba82cd867bca393f"],"state_sha256":"f35be6dd6edb1b270051ed5dad235f11898036b0e50583271c3623e5839a9877"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kLCiBlrCwKxbIDyQ/2o81+6GrRaH6t4yXbpXOCf8OoUNvDi1IXFFKGR6ve50Bfyo/cyZ37VWkd1YjZyi09dCBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-28T10:01:19.012770Z","bundle_sha256":"d6c4283f06ca9f586efbfb3b4d67312c3c59cab3215954038324bdaf41a0a36b"}}