{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:KOT6CL3ANMEURBU4IDC2OKRGEH","short_pith_number":"pith:KOT6CL3A","canonical_record":{"source":{"id":"2602.00443","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2026-01-31T01:38:55Z","cross_cats_sorted":["cs.MM","eess.AS"],"title_canon_sha256":"815ede98a0e19829d189cc7cd3d26a5ca8a5bee85627099d72bfe124146cd118","abstract_canon_sha256":"5760227cc5b784a5dca211356dda4aed3848aea374af6823f5f9501432440a9e"},"schema_version":"1.0"},"canonical_sha256":"53a7e12f606b0948869c40c5a72a2621c1ed741ee3d789ad0e10d5802d9cae91","source":{"kind":"arxiv","id":"2602.00443","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2602.00443","created_at":"2026-05-26T02:04:04Z"},{"alias_kind":"arxiv_version","alias_value":"2602.00443v2","created_at":"2026-05-26T02:04:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2602.00443","created_at":"2026-05-26T02:04:04Z"},{"alias_kind":"pith_short_12","alias_value":"KOT6CL3ANMEU","created_at":"2026-05-26T02:04:04Z"},{"alias_kind":"pith_short_16","alias_value":"KOT6CL3ANMEURBU4","created_at":"2026-05-26T02:04:04Z"},{"alias_kind":"pith_short_8","alias_value":"KOT6CL3A","created_at":"2026-05-26T02:04:04Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:KOT6CL3ANMEURBU4IDC2OKRGEH","target":"record","payload":{"canonical_record":{"source":{"id":"2602.00443","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2026-01-31T01:38:55Z","cross_cats_sorted":["cs.MM","eess.AS"],"title_canon_sha256":"815ede98a0e19829d189cc7cd3d26a5ca8a5bee85627099d72bfe124146cd118","abstract_canon_sha256":"5760227cc5b784a5dca211356dda4aed3848aea374af6823f5f9501432440a9e"},"schema_version":"1.0"},"canonical_sha256":"53a7e12f606b0948869c40c5a72a2621c1ed741ee3d789ad0e10d5802d9cae91","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-26T02:04:04.047861Z","signature_b64":"QK7GR8q5uOFbPeh/w6Qxexo1O9WCH90J7cNpfAMh9ppJnBMbgkuIH7Unu8+SZxfqcHRcoB3fEVOv3/Pbzb+BDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"53a7e12f606b0948869c40c5a72a2621c1ed741ee3d789ad0e10d5802d9cae91","last_reissued_at":"2026-05-26T02:04:04.046981Z","signature_status":"signed_v1","first_computed_at":"2026-05-26T02:04:04.046981Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2602.00443","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-26T02:04:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"sGzcet18s8rga5axuymZFY4gmvY/G0NY/lRBDrhSG0FdfnV1/tA5zcNE0odAQn/R8zCvX36aApG4zzBp95MMBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T13:34:08.821498Z"},"content_sha256":"3deff6b4585264793ac18420c37ba448f42abd388f589840ffa40f31ab599dc8","schema_version":"1.0","event_id":"sha256:3deff6b4585264793ac18420c37ba448f42abd388f589840ffa40f31ab599dc8"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:KOT6CL3ANMEURBU4IDC2OKRGEH","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"RVCBench: Benchmarking the Robustness of Voice Cloning Across Modern Audio Generation Models","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.MM","eess.AS"],"primary_cat":"cs.SD","authors_text":"Deval Pandya, Hanlin Yu, Ruinan Jin, Xiaoxiao Li, Xinting Liao","submitted_at":"2026-01-31T01:38:55Z","abstract_excerpt":"Modern voice cloning, also known as zero-shot text-to-speech (TTS), can synthesize speech that closely matches a target speaker from only seconds of reference audio, enabling applications such as personalized speech interfaces and dubbing. In practice, these systems often face noisy reference audio, imperfect text prompts, multilingual and long-form generation, post-processing, and adversarial perturbations, all of which can weaken robustness. Despite rapid progress in codec-token language models and diffusion-based TTS, robustness under realistic deployment shifts remains underexplored. This "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2602.00443","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2602.00443/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-26T02:04:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"vxUTi+6yOGospSDJqBsPqjopBGWTnFqkOY3hUOw9cEzVD4BCqTE++MEy2Gm9j8sRsihtRq+WjFw+RnjluLpwDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T13:34:08.821864Z"},"content_sha256":"44f12aef073b8559b3d65fb3f79f3c342e0b03ea4b4364f045731ad09864198d","schema_version":"1.0","event_id":"sha256:44f12aef073b8559b3d65fb3f79f3c342e0b03ea4b4364f045731ad09864198d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/KOT6CL3ANMEURBU4IDC2OKRGEH/bundle.json","state_url":"https://pith.science/pith/KOT6CL3ANMEURBU4IDC2OKRGEH/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/KOT6CL3ANMEURBU4IDC2OKRGEH/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-28T13:34:08Z","links":{"resolver":"https://pith.science/pith/KOT6CL3ANMEURBU4IDC2OKRGEH","bundle":"https://pith.science/pith/KOT6CL3ANMEURBU4IDC2OKRGEH/bundle.json","state":"https://pith.science/pith/KOT6CL3ANMEURBU4IDC2OKRGEH/state.json","well_known_bundle":"https://pith.science/.well-known/pith/KOT6CL3ANMEURBU4IDC2OKRGEH/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:KOT6CL3ANMEURBU4IDC2OKRGEH","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5760227cc5b784a5dca211356dda4aed3848aea374af6823f5f9501432440a9e","cross_cats_sorted":["cs.MM","eess.AS"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2026-01-31T01:38:55Z","title_canon_sha256":"815ede98a0e19829d189cc7cd3d26a5ca8a5bee85627099d72bfe124146cd118"},"schema_version":"1.0","source":{"id":"2602.00443","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2602.00443","created_at":"2026-05-26T02:04:04Z"},{"alias_kind":"arxiv_version","alias_value":"2602.00443v2","created_at":"2026-05-26T02:04:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2602.00443","created_at":"2026-05-26T02:04:04Z"},{"alias_kind":"pith_short_12","alias_value":"KOT6CL3ANMEU","created_at":"2026-05-26T02:04:04Z"},{"alias_kind":"pith_short_16","alias_value":"KOT6CL3ANMEURBU4","created_at":"2026-05-26T02:04:04Z"},{"alias_kind":"pith_short_8","alias_value":"KOT6CL3A","created_at":"2026-05-26T02:04:04Z"}],"graph_snapshots":[{"event_id":"sha256:44f12aef073b8559b3d65fb3f79f3c342e0b03ea4b4364f045731ad09864198d","target":"graph","created_at":"2026-05-26T02:04:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2602.00443/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Modern voice cloning, also known as zero-shot text-to-speech (TTS), can synthesize speech that closely matches a target speaker from only seconds of reference audio, enabling applications such as personalized speech interfaces and dubbing. In practice, these systems often face noisy reference audio, imperfect text prompts, multilingual and long-form generation, post-processing, and adversarial perturbations, all of which can weaken robustness. Despite rapid progress in codec-token language models and diffusion-based TTS, robustness under realistic deployment shifts remains underexplored. This ","authors_text":"Deval Pandya, Hanlin Yu, Ruinan Jin, Xiaoxiao Li, Xinting Liao","cross_cats":["cs.MM","eess.AS"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2026-01-31T01:38:55Z","title":"RVCBench: Benchmarking the Robustness of Voice Cloning Across Modern Audio Generation Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2602.00443","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3deff6b4585264793ac18420c37ba448f42abd388f589840ffa40f31ab599dc8","target":"record","created_at":"2026-05-26T02:04:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5760227cc5b784a5dca211356dda4aed3848aea374af6823f5f9501432440a9e","cross_cats_sorted":["cs.MM","eess.AS"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2026-01-31T01:38:55Z","title_canon_sha256":"815ede98a0e19829d189cc7cd3d26a5ca8a5bee85627099d72bfe124146cd118"},"schema_version":"1.0","source":{"id":"2602.00443","kind":"arxiv","version":2}},"canonical_sha256":"53a7e12f606b0948869c40c5a72a2621c1ed741ee3d789ad0e10d5802d9cae91","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"53a7e12f606b0948869c40c5a72a2621c1ed741ee3d789ad0e10d5802d9cae91","first_computed_at":"2026-05-26T02:04:04.046981Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-26T02:04:04.046981Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"QK7GR8q5uOFbPeh/w6Qxexo1O9WCH90J7cNpfAMh9ppJnBMbgkuIH7Unu8+SZxfqcHRcoB3fEVOv3/Pbzb+BDw==","signature_status":"signed_v1","signed_at":"2026-05-26T02:04:04.047861Z","signed_message":"canonical_sha256_bytes"},"source_id":"2602.00443","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3deff6b4585264793ac18420c37ba448f42abd388f589840ffa40f31ab599dc8","sha256:44f12aef073b8559b3d65fb3f79f3c342e0b03ea4b4364f045731ad09864198d"],"state_sha256":"420df2b61ec6c8a775fe40cf219605a13014c5485b3f69ea2008bc08240adbf1"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"qFtV6bCux76qqZ9o+JypKLIz+ZMaVd07TCH7TncJhY/7U1pUpTZnq5uAAYd2A7Y4j6Na2LEpuTN7pkdly0YICw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-28T13:34:08.823792Z","bundle_sha256":"60717ef18499f16257ab82e8bf247090522e1cee5c53678fcb28438680d50154"}}