{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:PSFYY35Z5Q43PE36YMYAXH7EE7","short_pith_number":"pith:PSFYY35Z","canonical_record":{"source":{"id":"1709.07941","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2017-09-22T20:49:41Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"b3d69454522d28bb4283a8d05b0f99cc1fc754d343346cf1c1da974c7516c928","abstract_canon_sha256":"384c995f09672499e665e11b85293f57d715a8d08f78b171f6c283aaed14b254"},"schema_version":"1.0"},"canonical_sha256":"7c8b8c6fb9ec39b7937ec3300b9fe427d1a3d8f88dc13f4e4eedef4f42ff5a0e","source":{"kind":"arxiv","id":"1709.07941","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1709.07941","created_at":"2026-05-18T00:34:28Z"},{"alias_kind":"arxiv_version","alias_value":"1709.07941v1","created_at":"2026-05-18T00:34:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1709.07941","created_at":"2026-05-18T00:34:28Z"},{"alias_kind":"pith_short_12","alias_value":"PSFYY35Z5Q43","created_at":"2026-05-18T12:31:37Z"},{"alias_kind":"pith_short_16","alias_value":"PSFYY35Z5Q43PE36","created_at":"2026-05-18T12:31:37Z"},{"alias_kind":"pith_short_8","alias_value":"PSFYY35Z","created_at":"2026-05-18T12:31:37Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:PSFYY35Z5Q43PE36YMYAXH7EE7","target":"record","payload":{"canonical_record":{"source":{"id":"1709.07941","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2017-09-22T20:49:41Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"b3d69454522d28bb4283a8d05b0f99cc1fc754d343346cf1c1da974c7516c928","abstract_canon_sha256":"384c995f09672499e665e11b85293f57d715a8d08f78b171f6c283aaed14b254"},"schema_version":"1.0"},"canonical_sha256":"7c8b8c6fb9ec39b7937ec3300b9fe427d1a3d8f88dc13f4e4eedef4f42ff5a0e","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:34:28.471526Z","signature_b64":"Bb9rSeoh437BLVLRTig7dXmOPN1oEb2eQt/nqpH51SjTZiUoWSKrf8cqryRFSbX9eiPiRByM9MtKF83k9v5PDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"7c8b8c6fb9ec39b7937ec3300b9fe427d1a3d8f88dc13f4e4eedef4f42ff5a0e","last_reissued_at":"2026-05-18T00:34:28.471095Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:34:28.471095Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1709.07941","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:34:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"uVNJxC+mTeUqgIIJbIqYFXUaP3/bZ6uhNFs6ykSYeqbhbgGaF2L0oDfDC7HzMfjCvKq3CFivSGzFKu+se9GICA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-21T01:39:20.026374Z"},"content_sha256":"c287156d56b058f1d1bd083d1c572de42fb8c5af8e9dd4cad11207398f4c3d15","schema_version":"1.0","event_id":"sha256:c287156d56b058f1d1bd083d1c572de42fb8c5af8e9dd4cad11207398f4c3d15"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:PSFYY35Z5Q43PE36YMYAXH7EE7","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Efficiently Discovering Locally Exceptional yet Globally Representative Subgroups","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.DB","authors_text":"Janis Kalofolias, Jilles Vreeken, Mario Boley","submitted_at":"2017-09-22T20:49:41Z","abstract_excerpt":"Subgroup discovery is a local pattern mining technique to find interpretable descriptions of sub-populations that stand out on a given target variable. That is, these sub-populations are exceptional with regard to the global distribution. In this paper we argue that in many applications, such as scientific discovery, subgroups are only useful if they are additionally representative of the global distribution with regard to a control variable. That is, when the distribution of this control variable is the same, or almost the same, as over the whole data.\n  We formalise this objective function a"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1709.07941","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:34:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"MrrBTZB0HZm0LbYd559aYJtOH5SKSOoWTxML7IfjQVHcj56umv+k3fbMZORC1IrOJKNnGdSyFf+ko6JTFx3nBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-21T01:39:20.026755Z"},"content_sha256":"d12dce0e50ca1b4de3bb1a6b4bf1e70744fa9f665bc00dd9c2946ecd20a7679f","schema_version":"1.0","event_id":"sha256:d12dce0e50ca1b4de3bb1a6b4bf1e70744fa9f665bc00dd9c2946ecd20a7679f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/PSFYY35Z5Q43PE36YMYAXH7EE7/bundle.json","state_url":"https://pith.science/pith/PSFYY35Z5Q43PE36YMYAXH7EE7/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/PSFYY35Z5Q43PE36YMYAXH7EE7/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-21T01:39:20Z","links":{"resolver":"https://pith.science/pith/PSFYY35Z5Q43PE36YMYAXH7EE7","bundle":"https://pith.science/pith/PSFYY35Z5Q43PE36YMYAXH7EE7/bundle.json","state":"https://pith.science/pith/PSFYY35Z5Q43PE36YMYAXH7EE7/state.json","well_known_bundle":"https://pith.science/.well-known/pith/PSFYY35Z5Q43PE36YMYAXH7EE7/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:PSFYY35Z5Q43PE36YMYAXH7EE7","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"384c995f09672499e665e11b85293f57d715a8d08f78b171f6c283aaed14b254","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2017-09-22T20:49:41Z","title_canon_sha256":"b3d69454522d28bb4283a8d05b0f99cc1fc754d343346cf1c1da974c7516c928"},"schema_version":"1.0","source":{"id":"1709.07941","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1709.07941","created_at":"2026-05-18T00:34:28Z"},{"alias_kind":"arxiv_version","alias_value":"1709.07941v1","created_at":"2026-05-18T00:34:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1709.07941","created_at":"2026-05-18T00:34:28Z"},{"alias_kind":"pith_short_12","alias_value":"PSFYY35Z5Q43","created_at":"2026-05-18T12:31:37Z"},{"alias_kind":"pith_short_16","alias_value":"PSFYY35Z5Q43PE36","created_at":"2026-05-18T12:31:37Z"},{"alias_kind":"pith_short_8","alias_value":"PSFYY35Z","created_at":"2026-05-18T12:31:37Z"}],"graph_snapshots":[{"event_id":"sha256:d12dce0e50ca1b4de3bb1a6b4bf1e70744fa9f665bc00dd9c2946ecd20a7679f","target":"graph","created_at":"2026-05-18T00:34:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Subgroup discovery is a local pattern mining technique to find interpretable descriptions of sub-populations that stand out on a given target variable. That is, these sub-populations are exceptional with regard to the global distribution. In this paper we argue that in many applications, such as scientific discovery, subgroups are only useful if they are additionally representative of the global distribution with regard to a control variable. That is, when the distribution of this control variable is the same, or almost the same, as over the whole data.\n  We formalise this objective function a","authors_text":"Janis Kalofolias, Jilles Vreeken, Mario Boley","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2017-09-22T20:49:41Z","title":"Efficiently Discovering Locally Exceptional yet Globally Representative Subgroups"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1709.07941","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:c287156d56b058f1d1bd083d1c572de42fb8c5af8e9dd4cad11207398f4c3d15","target":"record","created_at":"2026-05-18T00:34:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"384c995f09672499e665e11b85293f57d715a8d08f78b171f6c283aaed14b254","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DB","submitted_at":"2017-09-22T20:49:41Z","title_canon_sha256":"b3d69454522d28bb4283a8d05b0f99cc1fc754d343346cf1c1da974c7516c928"},"schema_version":"1.0","source":{"id":"1709.07941","kind":"arxiv","version":1}},"canonical_sha256":"7c8b8c6fb9ec39b7937ec3300b9fe427d1a3d8f88dc13f4e4eedef4f42ff5a0e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"7c8b8c6fb9ec39b7937ec3300b9fe427d1a3d8f88dc13f4e4eedef4f42ff5a0e","first_computed_at":"2026-05-18T00:34:28.471095Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:34:28.471095Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Bb9rSeoh437BLVLRTig7dXmOPN1oEb2eQt/nqpH51SjTZiUoWSKrf8cqryRFSbX9eiPiRByM9MtKF83k9v5PDw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:34:28.471526Z","signed_message":"canonical_sha256_bytes"},"source_id":"1709.07941","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:c287156d56b058f1d1bd083d1c572de42fb8c5af8e9dd4cad11207398f4c3d15","sha256:d12dce0e50ca1b4de3bb1a6b4bf1e70744fa9f665bc00dd9c2946ecd20a7679f"],"state_sha256":"bf4cb9efd0de7a70e8971f6dd6d765581d292f07d2dfba9b3b98c374fda95404"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"5WS8nYJDpApKgPwEN3+P7MyUr7B18MLJ1bixGvAmStdKfvteXz0WuTmQL9Vj4ioA3JNwrJqAlhdN6shWW9KDBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-21T01:39:20.028731Z","bundle_sha256":"45158477c598ede9680a08ac32e32de6ba6f0f8f9d7f550e7d783040a0977ffb"}}