{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:STEVJY6CYHYU4GRPMWXRHNVAP2","short_pith_number":"pith:STEVJY6C","canonical_record":{"source":{"id":"2606.07631","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-31T04:28:21Z","cross_cats_sorted":["cs.AI","cs.CY"],"title_canon_sha256":"1c949e7fc7fe22e1bc185ecf4a9a066120e7e4f4c9ac93bf19b62bb15ca7e393","abstract_canon_sha256":"35e318a81a995000dce9c8b5823bb33b1be88729b186229c76bd12f77393a13d"},"schema_version":"1.0"},"canonical_sha256":"94c954e3c2c1f14e1a2f65af13b6a07e9fed098907cbc2340130c28d6c07cddd","source":{"kind":"arxiv","id":"2606.07631","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.07631","created_at":"2026-06-09T00:04:45Z"},{"alias_kind":"arxiv_version","alias_value":"2606.07631v1","created_at":"2026-06-09T00:04:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.07631","created_at":"2026-06-09T00:04:45Z"},{"alias_kind":"pith_short_12","alias_value":"STEVJY6CYHYU","created_at":"2026-06-09T00:04:45Z"},{"alias_kind":"pith_short_16","alias_value":"STEVJY6CYHYU4GRP","created_at":"2026-06-09T00:04:45Z"},{"alias_kind":"pith_short_8","alias_value":"STEVJY6C","created_at":"2026-06-09T00:04:45Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:STEVJY6CYHYU4GRPMWXRHNVAP2","target":"record","payload":{"canonical_record":{"source":{"id":"2606.07631","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-31T04:28:21Z","cross_cats_sorted":["cs.AI","cs.CY"],"title_canon_sha256":"1c949e7fc7fe22e1bc185ecf4a9a066120e7e4f4c9ac93bf19b62bb15ca7e393","abstract_canon_sha256":"35e318a81a995000dce9c8b5823bb33b1be88729b186229c76bd12f77393a13d"},"schema_version":"1.0"},"canonical_sha256":"94c954e3c2c1f14e1a2f65af13b6a07e9fed098907cbc2340130c28d6c07cddd","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-09T00:04:45.249121Z","signature_b64":"0tMZJx+SJBwCovxd7LaQns4aid7RLE9SxDbeiAjNfEiUZdrbqhiFh5ik16NQgUsF0ktQG5TDrNMbBovcNhIzDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"94c954e3c2c1f14e1a2f65af13b6a07e9fed098907cbc2340130c28d6c07cddd","last_reissued_at":"2026-06-09T00:04:45.248782Z","signature_status":"signed_v1","first_computed_at":"2026-06-09T00:04:45.248782Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.07631","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-09T00:04:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hDivgh1/QjBa8YHg1H3eay2n85+AkNuTgrXENjnY+7jJ49dPjT1QRQjKT9pIZb16AI3bOspDcAtSVeQmJy3fCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-29T11:30:36.105538Z"},"content_sha256":"76fabc8e26d95bce0b1d98c0dd4ea25ef9175144e037eea30f1d46b78f517c0e","schema_version":"1.0","event_id":"sha256:76fabc8e26d95bce0b1d98c0dd4ea25ef9175144e037eea30f1d46b78f517c0e"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:STEVJY6CYHYU4GRPMWXRHNVAP2","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Trait-space Monitoring for Emergent Misalignment During Supervised Finetuning","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","cs.CY"],"primary_cat":"cs.LG","authors_text":"Hal Daum\\'e III, Huy Nghiem, Sarah Wiegreffe, Sy-Tuyen Ho","submitted_at":"2026-05-31T04:28:21Z","abstract_excerpt":"Emergent misalignment (EM) occurs when narrow finetuning causes a model to behave dangerously outside the finetuning task. Standard training signals can miss this shift, making reliable detection costly if it depends on repeated behavioral evaluation. We ask whether emergent misalignment can instead be detected from internal representations during finetuning. Using seven alignment-relevant traits encoded as linear directions in activation space, we track representational drift across training checkpoints in four open-source 7-9B LLMs. EM-relevant drift concentrates on a low-dimensional axis th"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.07631","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.07631/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-09T00:04:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hTl5vc6AWGrHR63dj7zifhtf1IRyJCqUhbdHdtGHTapzWU2+s9BSUCtC8O8Ee0A4AkjjHOQKU81Ld8VSsVAtDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-29T11:30:36.105929Z"},"content_sha256":"0c275d8ea457d705c936ff33d595fefc87c27b9638bedb50c9a9e5783d63f95d","schema_version":"1.0","event_id":"sha256:0c275d8ea457d705c936ff33d595fefc87c27b9638bedb50c9a9e5783d63f95d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/STEVJY6CYHYU4GRPMWXRHNVAP2/bundle.json","state_url":"https://pith.science/pith/STEVJY6CYHYU4GRPMWXRHNVAP2/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/STEVJY6CYHYU4GRPMWXRHNVAP2/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-29T11:30:36Z","links":{"resolver":"https://pith.science/pith/STEVJY6CYHYU4GRPMWXRHNVAP2","bundle":"https://pith.science/pith/STEVJY6CYHYU4GRPMWXRHNVAP2/bundle.json","state":"https://pith.science/pith/STEVJY6CYHYU4GRPMWXRHNVAP2/state.json","well_known_bundle":"https://pith.science/.well-known/pith/STEVJY6CYHYU4GRPMWXRHNVAP2/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:STEVJY6CYHYU4GRPMWXRHNVAP2","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"35e318a81a995000dce9c8b5823bb33b1be88729b186229c76bd12f77393a13d","cross_cats_sorted":["cs.AI","cs.CY"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-31T04:28:21Z","title_canon_sha256":"1c949e7fc7fe22e1bc185ecf4a9a066120e7e4f4c9ac93bf19b62bb15ca7e393"},"schema_version":"1.0","source":{"id":"2606.07631","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.07631","created_at":"2026-06-09T00:04:45Z"},{"alias_kind":"arxiv_version","alias_value":"2606.07631v1","created_at":"2026-06-09T00:04:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.07631","created_at":"2026-06-09T00:04:45Z"},{"alias_kind":"pith_short_12","alias_value":"STEVJY6CYHYU","created_at":"2026-06-09T00:04:45Z"},{"alias_kind":"pith_short_16","alias_value":"STEVJY6CYHYU4GRP","created_at":"2026-06-09T00:04:45Z"},{"alias_kind":"pith_short_8","alias_value":"STEVJY6C","created_at":"2026-06-09T00:04:45Z"}],"graph_snapshots":[{"event_id":"sha256:0c275d8ea457d705c936ff33d595fefc87c27b9638bedb50c9a9e5783d63f95d","target":"graph","created_at":"2026-06-09T00:04:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.07631/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Emergent misalignment (EM) occurs when narrow finetuning causes a model to behave dangerously outside the finetuning task. Standard training signals can miss this shift, making reliable detection costly if it depends on repeated behavioral evaluation. We ask whether emergent misalignment can instead be detected from internal representations during finetuning. Using seven alignment-relevant traits encoded as linear directions in activation space, we track representational drift across training checkpoints in four open-source 7-9B LLMs. EM-relevant drift concentrates on a low-dimensional axis th","authors_text":"Hal Daum\\'e III, Huy Nghiem, Sarah Wiegreffe, Sy-Tuyen Ho","cross_cats":["cs.AI","cs.CY"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-31T04:28:21Z","title":"Trait-space Monitoring for Emergent Misalignment During Supervised Finetuning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.07631","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:76fabc8e26d95bce0b1d98c0dd4ea25ef9175144e037eea30f1d46b78f517c0e","target":"record","created_at":"2026-06-09T00:04:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"35e318a81a995000dce9c8b5823bb33b1be88729b186229c76bd12f77393a13d","cross_cats_sorted":["cs.AI","cs.CY"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-31T04:28:21Z","title_canon_sha256":"1c949e7fc7fe22e1bc185ecf4a9a066120e7e4f4c9ac93bf19b62bb15ca7e393"},"schema_version":"1.0","source":{"id":"2606.07631","kind":"arxiv","version":1}},"canonical_sha256":"94c954e3c2c1f14e1a2f65af13b6a07e9fed098907cbc2340130c28d6c07cddd","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"94c954e3c2c1f14e1a2f65af13b6a07e9fed098907cbc2340130c28d6c07cddd","first_computed_at":"2026-06-09T00:04:45.248782Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-09T00:04:45.248782Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"0tMZJx+SJBwCovxd7LaQns4aid7RLE9SxDbeiAjNfEiUZdrbqhiFh5ik16NQgUsF0ktQG5TDrNMbBovcNhIzDQ==","signature_status":"signed_v1","signed_at":"2026-06-09T00:04:45.249121Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.07631","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:76fabc8e26d95bce0b1d98c0dd4ea25ef9175144e037eea30f1d46b78f517c0e","sha256:0c275d8ea457d705c936ff33d595fefc87c27b9638bedb50c9a9e5783d63f95d"],"state_sha256":"324a8b68ec396bf1d57bf5b9cfbc8473095f3ffb1b327cb3b1b313eb441ce8a2"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"0fMdc46f9dfxbak8SRuwkKCZMuGTjguaG+gv0Daw755ucyeTGlHay5yHgAPnf1euKsV1pEo8WUScZbtjJQvlCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-29T11:30:36.107949Z","bundle_sha256":"5064f38e28b463b7ba1b7c7558fbf997c2801d354302cfb21e8b4ed9d2d871b4"}}