{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:TWXDM4DIQSPBTRISYS3URT6OWU","short_pith_number":"pith:TWXDM4DI","canonical_record":{"source":{"id":"2606.31128","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SD","submitted_at":"2026-06-30T04:46:45Z","cross_cats_sorted":["cs.AI","cs.CL","eess.AS"],"title_canon_sha256":"93de76e505d85e9fc57b11c9e738bdf1a067ce7002855be0a7e86fd10615f867","abstract_canon_sha256":"56fc1e43975fbedee5e21d77b9f4a141c8218075220a1198136191c875773cff"},"schema_version":"1.0"},"canonical_sha256":"9dae367068849e19c512c4b748cfceb524b81a12c829a0b62e5c9b2c62c76f7a","source":{"kind":"arxiv","id":"2606.31128","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.31128","created_at":"2026-07-01T01:17:30Z"},{"alias_kind":"arxiv_version","alias_value":"2606.31128v1","created_at":"2026-07-01T01:17:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.31128","created_at":"2026-07-01T01:17:30Z"},{"alias_kind":"pith_short_12","alias_value":"TWXDM4DIQSPB","created_at":"2026-07-01T01:17:30Z"},{"alias_kind":"pith_short_16","alias_value":"TWXDM4DIQSPBTRIS","created_at":"2026-07-01T01:17:30Z"},{"alias_kind":"pith_short_8","alias_value":"TWXDM4DI","created_at":"2026-07-01T01:17:30Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:TWXDM4DIQSPBTRISYS3URT6OWU","target":"record","payload":{"canonical_record":{"source":{"id":"2606.31128","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SD","submitted_at":"2026-06-30T04:46:45Z","cross_cats_sorted":["cs.AI","cs.CL","eess.AS"],"title_canon_sha256":"93de76e505d85e9fc57b11c9e738bdf1a067ce7002855be0a7e86fd10615f867","abstract_canon_sha256":"56fc1e43975fbedee5e21d77b9f4a141c8218075220a1198136191c875773cff"},"schema_version":"1.0"},"canonical_sha256":"9dae367068849e19c512c4b748cfceb524b81a12c829a0b62e5c9b2c62c76f7a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-01T01:17:30.022499Z","signature_b64":"BwUM6yDCSnL38+z3hexQEDD2ki3aX4Og4YQ45+QcwwWtkTolnA8B2GAoQXER042YhMwpqt5EK+NdmzbdDKAwBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9dae367068849e19c512c4b748cfceb524b81a12c829a0b62e5c9b2c62c76f7a","last_reissued_at":"2026-07-01T01:17:30.022077Z","signature_status":"signed_v1","first_computed_at":"2026-07-01T01:17:30.022077Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.31128","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-01T01:17:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"uf/pYJPpjny4GbZs7G+oQNvJ7WqCKGjNwa1AvBRcq6Efe7Usqr93EcfOYhT+JYVLFNs0aRSSterK99cEulTMBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T16:21:59.644744Z"},"content_sha256":"13a7bc1574aa5f3c04533fa765f2f915f48000828fb35b21548daa68e50a59e3","schema_version":"1.0","event_id":"sha256:13a7bc1574aa5f3c04533fa765f2f915f48000828fb35b21548daa68e50a59e3"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:TWXDM4DIQSPBTRISYS3URT6OWU","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"UniSAE: Unified Speech Attribute Editing on Speaker, Emotion and Low-Level Content via Discrete Phonetic Posteriorgram Modelling","license":"http://creativecommons.org/licenses/by-sa/4.0/","headline":"","cross_cats":["cs.AI","cs.CL","eess.AS"],"primary_cat":"cs.SD","authors_text":"Chuanbo Zhu, Kun Qian, Rongxiu Zhong, Shilei Zhang, Wei Xue, Wuyou Zhou, Yike Guo","submitted_at":"2026-06-30T04:46:45Z","abstract_excerpt":"Speech editing aims to modify specific portions of an utterance while preserving the remaining speech. Existing approaches primarily focus on word-level content modification and typically treat content, speaker, and emotion editing as separate tasks, limiting both editing granularity and flexibility. We propose UniSAE, a unified speech attribute editing framework which supports composable speaker, emotion and content editing from sub-phoneme to word level within a single architecture. UniSAE introduces a Discrete Phonetic PosteriorGram (DPPG) representation that factorizes speech content into "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.31128","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.31128/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-01T01:17:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"amlKEjuEImpCPuffite1+zNffU4//uE7QYy0NUMy4GBJ1u4ylfT7mkx4HFVhzYSkyixB17L2bFssWJHLNDGhAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T16:21:59.645128Z"},"content_sha256":"1ae67eab8c9e1151189e27a94e3014064b8c32934e9acf5b82b48764b9abf5a5","schema_version":"1.0","event_id":"sha256:1ae67eab8c9e1151189e27a94e3014064b8c32934e9acf5b82b48764b9abf5a5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/TWXDM4DIQSPBTRISYS3URT6OWU/bundle.json","state_url":"https://pith.science/pith/TWXDM4DIQSPBTRISYS3URT6OWU/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/TWXDM4DIQSPBTRISYS3URT6OWU/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-02T16:21:59Z","links":{"resolver":"https://pith.science/pith/TWXDM4DIQSPBTRISYS3URT6OWU","bundle":"https://pith.science/pith/TWXDM4DIQSPBTRISYS3URT6OWU/bundle.json","state":"https://pith.science/pith/TWXDM4DIQSPBTRISYS3URT6OWU/state.json","well_known_bundle":"https://pith.science/.well-known/pith/TWXDM4DIQSPBTRISYS3URT6OWU/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:TWXDM4DIQSPBTRISYS3URT6OWU","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"56fc1e43975fbedee5e21d77b9f4a141c8218075220a1198136191c875773cff","cross_cats_sorted":["cs.AI","cs.CL","eess.AS"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SD","submitted_at":"2026-06-30T04:46:45Z","title_canon_sha256":"93de76e505d85e9fc57b11c9e738bdf1a067ce7002855be0a7e86fd10615f867"},"schema_version":"1.0","source":{"id":"2606.31128","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.31128","created_at":"2026-07-01T01:17:30Z"},{"alias_kind":"arxiv_version","alias_value":"2606.31128v1","created_at":"2026-07-01T01:17:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.31128","created_at":"2026-07-01T01:17:30Z"},{"alias_kind":"pith_short_12","alias_value":"TWXDM4DIQSPB","created_at":"2026-07-01T01:17:30Z"},{"alias_kind":"pith_short_16","alias_value":"TWXDM4DIQSPBTRIS","created_at":"2026-07-01T01:17:30Z"},{"alias_kind":"pith_short_8","alias_value":"TWXDM4DI","created_at":"2026-07-01T01:17:30Z"}],"graph_snapshots":[{"event_id":"sha256:1ae67eab8c9e1151189e27a94e3014064b8c32934e9acf5b82b48764b9abf5a5","target":"graph","created_at":"2026-07-01T01:17:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.31128/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Speech editing aims to modify specific portions of an utterance while preserving the remaining speech. Existing approaches primarily focus on word-level content modification and typically treat content, speaker, and emotion editing as separate tasks, limiting both editing granularity and flexibility. We propose UniSAE, a unified speech attribute editing framework which supports composable speaker, emotion and content editing from sub-phoneme to word level within a single architecture. UniSAE introduces a Discrete Phonetic PosteriorGram (DPPG) representation that factorizes speech content into ","authors_text":"Chuanbo Zhu, Kun Qian, Rongxiu Zhong, Shilei Zhang, Wei Xue, Wuyou Zhou, Yike Guo","cross_cats":["cs.AI","cs.CL","eess.AS"],"headline":"","license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SD","submitted_at":"2026-06-30T04:46:45Z","title":"UniSAE: Unified Speech Attribute Editing on Speaker, Emotion and Low-Level Content via Discrete Phonetic Posteriorgram Modelling"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.31128","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:13a7bc1574aa5f3c04533fa765f2f915f48000828fb35b21548daa68e50a59e3","target":"record","created_at":"2026-07-01T01:17:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"56fc1e43975fbedee5e21d77b9f4a141c8218075220a1198136191c875773cff","cross_cats_sorted":["cs.AI","cs.CL","eess.AS"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SD","submitted_at":"2026-06-30T04:46:45Z","title_canon_sha256":"93de76e505d85e9fc57b11c9e738bdf1a067ce7002855be0a7e86fd10615f867"},"schema_version":"1.0","source":{"id":"2606.31128","kind":"arxiv","version":1}},"canonical_sha256":"9dae367068849e19c512c4b748cfceb524b81a12c829a0b62e5c9b2c62c76f7a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9dae367068849e19c512c4b748cfceb524b81a12c829a0b62e5c9b2c62c76f7a","first_computed_at":"2026-07-01T01:17:30.022077Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-01T01:17:30.022077Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"BwUM6yDCSnL38+z3hexQEDD2ki3aX4Og4YQ45+QcwwWtkTolnA8B2GAoQXER042YhMwpqt5EK+NdmzbdDKAwBA==","signature_status":"signed_v1","signed_at":"2026-07-01T01:17:30.022499Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.31128","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:13a7bc1574aa5f3c04533fa765f2f915f48000828fb35b21548daa68e50a59e3","sha256:1ae67eab8c9e1151189e27a94e3014064b8c32934e9acf5b82b48764b9abf5a5"],"state_sha256":"63755eed6874324796de96b2243ff91c4d21762d92b83915b0f7356dc24eaebf"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ddolHTacyM6yPJl7q1hQ9CjLCUXKacTiTRMqeetNYZpAOr8vRXZvcd9qlcOOXjVEZJ311Y1NtKHfFlc8E0B0CA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-02T16:21:59.647131Z","bundle_sha256":"1cf40c14662263c8de5b608527fca34d7765cde5888596098f836dfdb721dece"}}