{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:XHUXQYCSUAWXWUYBZRARHHFWNX","short_pith_number":"pith:XHUXQYCS","canonical_record":{"source":{"id":"1703.08741","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ME","submitted_at":"2017-03-25T20:57:56Z","cross_cats_sorted":[],"title_canon_sha256":"cf2355300fe81ad06677d7ff109ff5686f78da9e180b96cca89f5dd3d9ba54bc","abstract_canon_sha256":"90f9f532cad15d03b6baf50981459e2144b27e5493e7dd525bdcfc1bb8d5b4d5"},"schema_version":"1.0"},"canonical_sha256":"b9e9786052a02d7b5301cc41139cb66dca788a6909eef71f99fed368f37e6b7d","source":{"kind":"arxiv","id":"1703.08741","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1703.08741","created_at":"2026-05-18T00:21:35Z"},{"alias_kind":"arxiv_version","alias_value":"1703.08741v2","created_at":"2026-05-18T00:21:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1703.08741","created_at":"2026-05-18T00:21:35Z"},{"alias_kind":"pith_short_12","alias_value":"XHUXQYCSUAWX","created_at":"2026-05-18T12:31:53Z"},{"alias_kind":"pith_short_16","alias_value":"XHUXQYCSUAWXWUYB","created_at":"2026-05-18T12:31:53Z"},{"alias_kind":"pith_short_8","alias_value":"XHUXQYCS","created_at":"2026-05-18T12:31:53Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:XHUXQYCSUAWXWUYBZRARHHFWNX","target":"record","payload":{"canonical_record":{"source":{"id":"1703.08741","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ME","submitted_at":"2017-03-25T20:57:56Z","cross_cats_sorted":[],"title_canon_sha256":"cf2355300fe81ad06677d7ff109ff5686f78da9e180b96cca89f5dd3d9ba54bc","abstract_canon_sha256":"90f9f532cad15d03b6baf50981459e2144b27e5493e7dd525bdcfc1bb8d5b4d5"},"schema_version":"1.0"},"canonical_sha256":"b9e9786052a02d7b5301cc41139cb66dca788a6909eef71f99fed368f37e6b7d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:21:35.163153Z","signature_b64":"9JjL1iBIPau53uOUrzw/yV0xX9QFHOVj1nEuwHhklru3GAhquNQAuCc79A6ELAh+bGy2kvtUpjzLoROfhqG+AA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b9e9786052a02d7b5301cc41139cb66dca788a6909eef71f99fed368f37e6b7d","last_reissued_at":"2026-05-18T00:21:35.162526Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:21:35.162526Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1703.08741","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:21:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"d5OX26XyxQ/osvB6a2FPC6UVXnJ5RpkbCRjReKlm/ah07z/fLZ/a3X4mj+Xm9qTm2lPJQy9uQUV4RcCXnJbSAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-20T10:14:15.290485Z"},"content_sha256":"a52f1a269ec103580da9f2c3cc9b9e688f0402365df27340be15608d4f75b0c2","schema_version":"1.0","event_id":"sha256:a52f1a269ec103580da9f2c3cc9b9e688f0402365df27340be15608d4f75b0c2"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:XHUXQYCSUAWXWUYBZRARHHFWNX","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Clustering and Variable Selection in the Presence of Mixed Variable Types and Missing Data","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"stat.ME","authors_text":"Amy Weaver, Curtis Storlie, John Port, Paul Croarkin, Robert Colligan, Robert Voigt, Ruth Stoeckel, Scott Myers, S Katusic","submitted_at":"2017-03-25T20:57:56Z","abstract_excerpt":"We consider the problem of model-based clustering in the presence of many correlated, mixed continuous and discrete variables, some of which may have missing values. Discrete variables are treated with a latent continuous variable approach and the Dirichlet process is used to construct a mixture model with an unknown number of components. Variable selection is also performed to identify the variables that are most influential for determining cluster membership. The work is motivated by the need to cluster patients thought to potentially have autism spectrum disorder (ASD) on the basis of many "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1703.08741","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:21:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jqctbj37Md5yBzp8j3D1vgxn65qWx5JTRMLX9y7d2/ZpvMNHOsa8tNHr4xnFR+HHdzdSgYfql04hXQpa3R77Ag==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-20T10:14:15.290827Z"},"content_sha256":"f723f07ead66e13ec8b88f5661f110c8eefaa5047b2c0228fdee0947f227818a","schema_version":"1.0","event_id":"sha256:f723f07ead66e13ec8b88f5661f110c8eefaa5047b2c0228fdee0947f227818a"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/XHUXQYCSUAWXWUYBZRARHHFWNX/bundle.json","state_url":"https://pith.science/pith/XHUXQYCSUAWXWUYBZRARHHFWNX/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/XHUXQYCSUAWXWUYBZRARHHFWNX/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-20T10:14:15Z","links":{"resolver":"https://pith.science/pith/XHUXQYCSUAWXWUYBZRARHHFWNX","bundle":"https://pith.science/pith/XHUXQYCSUAWXWUYBZRARHHFWNX/bundle.json","state":"https://pith.science/pith/XHUXQYCSUAWXWUYBZRARHHFWNX/state.json","well_known_bundle":"https://pith.science/.well-known/pith/XHUXQYCSUAWXWUYBZRARHHFWNX/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:XHUXQYCSUAWXWUYBZRARHHFWNX","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"90f9f532cad15d03b6baf50981459e2144b27e5493e7dd525bdcfc1bb8d5b4d5","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ME","submitted_at":"2017-03-25T20:57:56Z","title_canon_sha256":"cf2355300fe81ad06677d7ff109ff5686f78da9e180b96cca89f5dd3d9ba54bc"},"schema_version":"1.0","source":{"id":"1703.08741","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1703.08741","created_at":"2026-05-18T00:21:35Z"},{"alias_kind":"arxiv_version","alias_value":"1703.08741v2","created_at":"2026-05-18T00:21:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1703.08741","created_at":"2026-05-18T00:21:35Z"},{"alias_kind":"pith_short_12","alias_value":"XHUXQYCSUAWX","created_at":"2026-05-18T12:31:53Z"},{"alias_kind":"pith_short_16","alias_value":"XHUXQYCSUAWXWUYB","created_at":"2026-05-18T12:31:53Z"},{"alias_kind":"pith_short_8","alias_value":"XHUXQYCS","created_at":"2026-05-18T12:31:53Z"}],"graph_snapshots":[{"event_id":"sha256:f723f07ead66e13ec8b88f5661f110c8eefaa5047b2c0228fdee0947f227818a","target":"graph","created_at":"2026-05-18T00:21:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We consider the problem of model-based clustering in the presence of many correlated, mixed continuous and discrete variables, some of which may have missing values. Discrete variables are treated with a latent continuous variable approach and the Dirichlet process is used to construct a mixture model with an unknown number of components. Variable selection is also performed to identify the variables that are most influential for determining cluster membership. The work is motivated by the need to cluster patients thought to potentially have autism spectrum disorder (ASD) on the basis of many ","authors_text":"Amy Weaver, Curtis Storlie, John Port, Paul Croarkin, Robert Colligan, Robert Voigt, Ruth Stoeckel, Scott Myers, S Katusic","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ME","submitted_at":"2017-03-25T20:57:56Z","title":"Clustering and Variable Selection in the Presence of Mixed Variable Types and Missing Data"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1703.08741","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a52f1a269ec103580da9f2c3cc9b9e688f0402365df27340be15608d4f75b0c2","target":"record","created_at":"2026-05-18T00:21:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"90f9f532cad15d03b6baf50981459e2144b27e5493e7dd525bdcfc1bb8d5b4d5","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ME","submitted_at":"2017-03-25T20:57:56Z","title_canon_sha256":"cf2355300fe81ad06677d7ff109ff5686f78da9e180b96cca89f5dd3d9ba54bc"},"schema_version":"1.0","source":{"id":"1703.08741","kind":"arxiv","version":2}},"canonical_sha256":"b9e9786052a02d7b5301cc41139cb66dca788a6909eef71f99fed368f37e6b7d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b9e9786052a02d7b5301cc41139cb66dca788a6909eef71f99fed368f37e6b7d","first_computed_at":"2026-05-18T00:21:35.162526Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:21:35.162526Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"9JjL1iBIPau53uOUrzw/yV0xX9QFHOVj1nEuwHhklru3GAhquNQAuCc79A6ELAh+bGy2kvtUpjzLoROfhqG+AA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:21:35.163153Z","signed_message":"canonical_sha256_bytes"},"source_id":"1703.08741","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a52f1a269ec103580da9f2c3cc9b9e688f0402365df27340be15608d4f75b0c2","sha256:f723f07ead66e13ec8b88f5661f110c8eefaa5047b2c0228fdee0947f227818a"],"state_sha256":"5400f48b530c3cc84d8df19153d45809656c3e60d05755b92bafc00a2271ae10"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"fHS8hxTNF0eLmi3n3VWMzEBalwoxJ0CCNhAkUFcpE0HrbbncEHUvyJ1QReE3CM5cnYU2kLUPgsXEaSSDaRKTCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-20T10:14:15.292722Z","bundle_sha256":"aad657921bf5ee803a3a319faf426b81cab4c7867dabf2dd8340ae50620bb7ef"}}