{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:ASOSH5O4COI5T7JTL2PJNQ2KKB","short_pith_number":"pith:ASOSH5O4","canonical_record":{"source":{"id":"2512.15134","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-12-17T06:54:08Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"6b0194b57b8c4a0e03864a56d9870660e9692b5660b0e3782987e25f2c67bf93","abstract_canon_sha256":"7c7bcf313bc17798175b3bb03ff5cdd9e95e67fa570a0c53c6ee81c6d128a23c"},"schema_version":"1.0"},"canonical_sha256":"049d23f5dc1391d9fd335e9e96c34a504cfaad669efd46fe7758cd1e2b42f82a","source":{"kind":"arxiv","id":"2512.15134","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2512.15134","created_at":"2026-06-12T01:08:19Z"},{"alias_kind":"arxiv_version","alias_value":"2512.15134v2","created_at":"2026-06-12T01:08:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2512.15134","created_at":"2026-06-12T01:08:19Z"},{"alias_kind":"pith_short_12","alias_value":"ASOSH5O4COI5","created_at":"2026-06-12T01:08:19Z"},{"alias_kind":"pith_short_16","alias_value":"ASOSH5O4COI5T7JT","created_at":"2026-06-12T01:08:19Z"},{"alias_kind":"pith_short_8","alias_value":"ASOSH5O4","created_at":"2026-06-12T01:08:19Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:ASOSH5O4COI5T7JTL2PJNQ2KKB","target":"record","payload":{"canonical_record":{"source":{"id":"2512.15134","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-12-17T06:54:08Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"6b0194b57b8c4a0e03864a56d9870660e9692b5660b0e3782987e25f2c67bf93","abstract_canon_sha256":"7c7bcf313bc17798175b3bb03ff5cdd9e95e67fa570a0c53c6ee81c6d128a23c"},"schema_version":"1.0"},"canonical_sha256":"049d23f5dc1391d9fd335e9e96c34a504cfaad669efd46fe7758cd1e2b42f82a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-12T01:08:19.671523Z","signature_b64":"v+6kA0+mJ/U70bGA7kL/VI1OvuxMEuSUtzOwNBoHJEVVRFbU3Y2uwuE2PwOb8vETLkAOzBZjMGbykHOX8UpYDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"049d23f5dc1391d9fd335e9e96c34a504cfaad669efd46fe7758cd1e2b42f82a","last_reissued_at":"2026-06-12T01:08:19.670409Z","signature_status":"signed_v1","first_computed_at":"2026-06-12T01:08:19.670409Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2512.15134","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-12T01:08:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cWOUIXCbY56G4gRfL3FQxPuWOlbzhi781O8CcC0sM9wShi9hlgb4eIWRd5drJUyubVVxKqiWnZbvbB8G9rN1AQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-23T14:54:32.294678Z"},"content_sha256":"3825025f39374e5570c58768005189131f725ba7790440254a57de6aa1c45c80","schema_version":"1.0","event_id":"sha256:3825025f39374e5570c58768005189131f725ba7790440254a57de6aa1c45c80"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:ASOSH5O4COI5T7JTL2PJNQ2KKB","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"From Isolation to Entanglement: When Do Interpretability Methods Identify and Disentangle Known Concepts?","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CL"],"primary_cat":"cs.LG","authors_text":"Aaron Mueller, Andrew Lee, Dhanya Sridhar, Ekdeep Singh Lubana, Patrik Reizinger, Shruti Joshi","submitted_at":"2025-12-17T06:54:08Z","abstract_excerpt":"A goal of interpretability is to recover disentangled representations of latent concepts (features) from the activations of neural networks. The quality of features is typically evaluated in isolation, and under implicit independence assumptions that may not hold in practice. Thus, it is unclear to what extent common featurization methods such as sparse autoencoders (SAEs) and probes disentangle one concept from another. We propose a multi-concept evaluation setting using concepts including sentiment, domain, voice, and tense. We evaluate how well featurizers produce disentangled representatio"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2512.15134","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2512.15134/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-12T01:08:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hFdiO9zbJ77tBfuXiDywKOQE3w+7+oBoOAZGMY17JROHQKjArGS+/ur/upTDCx3NtlfA2A7NQgp0KFn7ib55Cw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-23T14:54:32.295063Z"},"content_sha256":"4d62ed8c08a6d8e49f24a61bb1c5ce4566b2e4201fc0c48f24dfeb163b0acbb7","schema_version":"1.0","event_id":"sha256:4d62ed8c08a6d8e49f24a61bb1c5ce4566b2e4201fc0c48f24dfeb163b0acbb7"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ASOSH5O4COI5T7JTL2PJNQ2KKB/bundle.json","state_url":"https://pith.science/pith/ASOSH5O4COI5T7JTL2PJNQ2KKB/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ASOSH5O4COI5T7JTL2PJNQ2KKB/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-23T14:54:32Z","links":{"resolver":"https://pith.science/pith/ASOSH5O4COI5T7JTL2PJNQ2KKB","bundle":"https://pith.science/pith/ASOSH5O4COI5T7JTL2PJNQ2KKB/bundle.json","state":"https://pith.science/pith/ASOSH5O4COI5T7JTL2PJNQ2KKB/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ASOSH5O4COI5T7JTL2PJNQ2KKB/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:ASOSH5O4COI5T7JTL2PJNQ2KKB","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7c7bcf313bc17798175b3bb03ff5cdd9e95e67fa570a0c53c6ee81c6d128a23c","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-12-17T06:54:08Z","title_canon_sha256":"6b0194b57b8c4a0e03864a56d9870660e9692b5660b0e3782987e25f2c67bf93"},"schema_version":"1.0","source":{"id":"2512.15134","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2512.15134","created_at":"2026-06-12T01:08:19Z"},{"alias_kind":"arxiv_version","alias_value":"2512.15134v2","created_at":"2026-06-12T01:08:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2512.15134","created_at":"2026-06-12T01:08:19Z"},{"alias_kind":"pith_short_12","alias_value":"ASOSH5O4COI5","created_at":"2026-06-12T01:08:19Z"},{"alias_kind":"pith_short_16","alias_value":"ASOSH5O4COI5T7JT","created_at":"2026-06-12T01:08:19Z"},{"alias_kind":"pith_short_8","alias_value":"ASOSH5O4","created_at":"2026-06-12T01:08:19Z"}],"graph_snapshots":[{"event_id":"sha256:4d62ed8c08a6d8e49f24a61bb1c5ce4566b2e4201fc0c48f24dfeb163b0acbb7","target":"graph","created_at":"2026-06-12T01:08:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2512.15134/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"A goal of interpretability is to recover disentangled representations of latent concepts (features) from the activations of neural networks. The quality of features is typically evaluated in isolation, and under implicit independence assumptions that may not hold in practice. Thus, it is unclear to what extent common featurization methods such as sparse autoencoders (SAEs) and probes disentangle one concept from another. We propose a multi-concept evaluation setting using concepts including sentiment, domain, voice, and tense. We evaluate how well featurizers produce disentangled representatio","authors_text":"Aaron Mueller, Andrew Lee, Dhanya Sridhar, Ekdeep Singh Lubana, Patrik Reizinger, Shruti Joshi","cross_cats":["cs.AI","cs.CL"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-12-17T06:54:08Z","title":"From Isolation to Entanglement: When Do Interpretability Methods Identify and Disentangle Known Concepts?"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2512.15134","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3825025f39374e5570c58768005189131f725ba7790440254a57de6aa1c45c80","target":"record","created_at":"2026-06-12T01:08:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7c7bcf313bc17798175b3bb03ff5cdd9e95e67fa570a0c53c6ee81c6d128a23c","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-12-17T06:54:08Z","title_canon_sha256":"6b0194b57b8c4a0e03864a56d9870660e9692b5660b0e3782987e25f2c67bf93"},"schema_version":"1.0","source":{"id":"2512.15134","kind":"arxiv","version":2}},"canonical_sha256":"049d23f5dc1391d9fd335e9e96c34a504cfaad669efd46fe7758cd1e2b42f82a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"049d23f5dc1391d9fd335e9e96c34a504cfaad669efd46fe7758cd1e2b42f82a","first_computed_at":"2026-06-12T01:08:19.670409Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-12T01:08:19.670409Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"v+6kA0+mJ/U70bGA7kL/VI1OvuxMEuSUtzOwNBoHJEVVRFbU3Y2uwuE2PwOb8vETLkAOzBZjMGbykHOX8UpYDA==","signature_status":"signed_v1","signed_at":"2026-06-12T01:08:19.671523Z","signed_message":"canonical_sha256_bytes"},"source_id":"2512.15134","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3825025f39374e5570c58768005189131f725ba7790440254a57de6aa1c45c80","sha256:4d62ed8c08a6d8e49f24a61bb1c5ce4566b2e4201fc0c48f24dfeb163b0acbb7"],"state_sha256":"404352704c98f46d4a72061e440c8b93a6a1238071ad9175d1f482d875583c75"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Vtk1hcxI/PwZRSMyFxBcpGsyT2DUaek+89VlvOtgoo5shQJnAXDt0+pjSjQLZ8d1smurnfhbfAT8Ra5B8WHiAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-23T14:54:32.297125Z","bundle_sha256":"2ade59c76145bd3bc08a2d64ff05fb8e41194729861d7000e09084018be96155"}}