{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:4LJGKOX2EW7ZKHM5XEXO7UJKMJ","short_pith_number":"pith:4LJGKOX2","canonical_record":{"source":{"id":"2607.01563","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/publicdomain/zero/1.0/","primary_cat":"eess.AS","submitted_at":"2026-07-02T00:43:14Z","cross_cats_sorted":[],"title_canon_sha256":"f3b1de34ce32039604ece2c61d42d3b4c08fd1281a103623b04573856a35bbb5","abstract_canon_sha256":"193f38613c0f4df12fb00aabb407c6f8ed8c2f1a9a5d9e37e85f11bc070ef266"},"schema_version":"1.0"},"canonical_sha256":"e2d2653afa25bf951d9db92eefd12a625975049ac95c9367de8cc1197b6c7594","source":{"kind":"arxiv","id":"2607.01563","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2607.01563","created_at":"2026-07-03T00:17:04Z"},{"alias_kind":"arxiv_version","alias_value":"2607.01563v1","created_at":"2026-07-03T00:17:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2607.01563","created_at":"2026-07-03T00:17:04Z"},{"alias_kind":"pith_short_12","alias_value":"4LJGKOX2EW7Z","created_at":"2026-07-03T00:17:04Z"},{"alias_kind":"pith_short_16","alias_value":"4LJGKOX2EW7ZKHM5","created_at":"2026-07-03T00:17:04Z"},{"alias_kind":"pith_short_8","alias_value":"4LJGKOX2","created_at":"2026-07-03T00:17:04Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:4LJGKOX2EW7ZKHM5XEXO7UJKMJ","target":"record","payload":{"canonical_record":{"source":{"id":"2607.01563","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/publicdomain/zero/1.0/","primary_cat":"eess.AS","submitted_at":"2026-07-02T00:43:14Z","cross_cats_sorted":[],"title_canon_sha256":"f3b1de34ce32039604ece2c61d42d3b4c08fd1281a103623b04573856a35bbb5","abstract_canon_sha256":"193f38613c0f4df12fb00aabb407c6f8ed8c2f1a9a5d9e37e85f11bc070ef266"},"schema_version":"1.0"},"canonical_sha256":"e2d2653afa25bf951d9db92eefd12a625975049ac95c9367de8cc1197b6c7594","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-03T00:17:04.131610Z","signature_b64":"Lji8hYQPgOldUmg3zRojsfakJhaPfa+KyeeHzLqhyOcTfo6usEHQXTk0Z+KyKnShwTqlQodxNxB9joe6c/iYCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e2d2653afa25bf951d9db92eefd12a625975049ac95c9367de8cc1197b6c7594","last_reissued_at":"2026-07-03T00:17:04.131168Z","signature_status":"signed_v1","first_computed_at":"2026-07-03T00:17:04.131168Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2607.01563","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-03T00:17:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hUTuy8yCyJAcj8rtVdcuUOZ4Bnx5bfD/tl1hGyU8nH4uRJdwXy+NATwVRa/8FLoxWo7CrclV+oXO3y65G5blAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-03T12:20:59.451128Z"},"content_sha256":"c97d358d6148c7395ac9ce78d39e8f31dfc647433b6b119791802bc967cef9e0","schema_version":"1.0","event_id":"sha256:c97d358d6148c7395ac9ce78d39e8f31dfc647433b6b119791802bc967cef9e0"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:4LJGKOX2EW7ZKHM5XEXO7UJKMJ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Beyond Words: Towards Effective Modeling of Non-Verbal Vocalizations in ASR","license":"http://creativecommons.org/publicdomain/zero/1.0/","headline":"","cross_cats":[],"primary_cat":"eess.AS","authors_text":"Bach Do, Florian Metze, Gene Yang, Haibin Wu, Ming Sun, Minxue Niu, Peng Su, Ruizhe Huang, Shang-Wen Li, Suwon Shon, Yossi Adi, Yuzong Liu, Zhaoheng Ni","submitted_at":"2026-07-02T00:43:14Z","abstract_excerpt":"Modern automatic speech recognition (ASR) systems excel at transcribing lexical content but often omit nonverbal vocalizations (NVs), such as laughter, breaths, coughs, and cries, that carry conversational and affective information. Modeling NVs in ASR is challenging because NV annotations are sparse and highly long-tailed, with frequent categories such as breaths and laughter dominating rarer events such as cries and coughs. We study three data-centric strategies for improving low-resource NV recognition: (1) a two-stage curriculum that first maps all NV events to a generic token and then fin"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2607.01563","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2607.01563/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-03T00:17:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cuTo/IAZraRrYaoAuKqKoF0C3Adt2H+GYCadeQJyUHzcAGZA6ftoIIKJIFxrw4ramcGhepoUKJgNXdCEhHyIAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-03T12:20:59.451526Z"},"content_sha256":"53e07be056b70d8bc1e937ce5f024f624559b008b826e270c658af9fb72d277e","schema_version":"1.0","event_id":"sha256:53e07be056b70d8bc1e937ce5f024f624559b008b826e270c658af9fb72d277e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/4LJGKOX2EW7ZKHM5XEXO7UJKMJ/bundle.json","state_url":"https://pith.science/pith/4LJGKOX2EW7ZKHM5XEXO7UJKMJ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/4LJGKOX2EW7ZKHM5XEXO7UJKMJ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-03T12:20:59Z","links":{"resolver":"https://pith.science/pith/4LJGKOX2EW7ZKHM5XEXO7UJKMJ","bundle":"https://pith.science/pith/4LJGKOX2EW7ZKHM5XEXO7UJKMJ/bundle.json","state":"https://pith.science/pith/4LJGKOX2EW7ZKHM5XEXO7UJKMJ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/4LJGKOX2EW7ZKHM5XEXO7UJKMJ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:4LJGKOX2EW7ZKHM5XEXO7UJKMJ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"193f38613c0f4df12fb00aabb407c6f8ed8c2f1a9a5d9e37e85f11bc070ef266","cross_cats_sorted":[],"license":"http://creativecommons.org/publicdomain/zero/1.0/","primary_cat":"eess.AS","submitted_at":"2026-07-02T00:43:14Z","title_canon_sha256":"f3b1de34ce32039604ece2c61d42d3b4c08fd1281a103623b04573856a35bbb5"},"schema_version":"1.0","source":{"id":"2607.01563","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2607.01563","created_at":"2026-07-03T00:17:04Z"},{"alias_kind":"arxiv_version","alias_value":"2607.01563v1","created_at":"2026-07-03T00:17:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2607.01563","created_at":"2026-07-03T00:17:04Z"},{"alias_kind":"pith_short_12","alias_value":"4LJGKOX2EW7Z","created_at":"2026-07-03T00:17:04Z"},{"alias_kind":"pith_short_16","alias_value":"4LJGKOX2EW7ZKHM5","created_at":"2026-07-03T00:17:04Z"},{"alias_kind":"pith_short_8","alias_value":"4LJGKOX2","created_at":"2026-07-03T00:17:04Z"}],"graph_snapshots":[{"event_id":"sha256:53e07be056b70d8bc1e937ce5f024f624559b008b826e270c658af9fb72d277e","target":"graph","created_at":"2026-07-03T00:17:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2607.01563/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Modern automatic speech recognition (ASR) systems excel at transcribing lexical content but often omit nonverbal vocalizations (NVs), such as laughter, breaths, coughs, and cries, that carry conversational and affective information. Modeling NVs in ASR is challenging because NV annotations are sparse and highly long-tailed, with frequent categories such as breaths and laughter dominating rarer events such as cries and coughs. We study three data-centric strategies for improving low-resource NV recognition: (1) a two-stage curriculum that first maps all NV events to a generic token and then fin","authors_text":"Bach Do, Florian Metze, Gene Yang, Haibin Wu, Ming Sun, Minxue Niu, Peng Su, Ruizhe Huang, Shang-Wen Li, Suwon Shon, Yossi Adi, Yuzong Liu, Zhaoheng Ni","cross_cats":[],"headline":"","license":"http://creativecommons.org/publicdomain/zero/1.0/","primary_cat":"eess.AS","submitted_at":"2026-07-02T00:43:14Z","title":"Beyond Words: Towards Effective Modeling of Non-Verbal Vocalizations in ASR"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2607.01563","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:c97d358d6148c7395ac9ce78d39e8f31dfc647433b6b119791802bc967cef9e0","target":"record","created_at":"2026-07-03T00:17:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"193f38613c0f4df12fb00aabb407c6f8ed8c2f1a9a5d9e37e85f11bc070ef266","cross_cats_sorted":[],"license":"http://creativecommons.org/publicdomain/zero/1.0/","primary_cat":"eess.AS","submitted_at":"2026-07-02T00:43:14Z","title_canon_sha256":"f3b1de34ce32039604ece2c61d42d3b4c08fd1281a103623b04573856a35bbb5"},"schema_version":"1.0","source":{"id":"2607.01563","kind":"arxiv","version":1}},"canonical_sha256":"e2d2653afa25bf951d9db92eefd12a625975049ac95c9367de8cc1197b6c7594","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e2d2653afa25bf951d9db92eefd12a625975049ac95c9367de8cc1197b6c7594","first_computed_at":"2026-07-03T00:17:04.131168Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-03T00:17:04.131168Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Lji8hYQPgOldUmg3zRojsfakJhaPfa+KyeeHzLqhyOcTfo6usEHQXTk0Z+KyKnShwTqlQodxNxB9joe6c/iYCA==","signature_status":"signed_v1","signed_at":"2026-07-03T00:17:04.131610Z","signed_message":"canonical_sha256_bytes"},"source_id":"2607.01563","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:c97d358d6148c7395ac9ce78d39e8f31dfc647433b6b119791802bc967cef9e0","sha256:53e07be056b70d8bc1e937ce5f024f624559b008b826e270c658af9fb72d277e"],"state_sha256":"cfa2b6b73c4b07ffe0ed03d284685e3a6b09f2841bebd09f9ac385f652aeada7"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Hvqr4P3+MMjgV4LGB6lWs9uW57nW1WoQ6zHa9oR+Fds7QM3RCFFdMrGuKYU83k9D9tvmEZ9HfTQqBOK3SWCZDg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-03T12:20:59.453621Z","bundle_sha256":"d298e3b2835c80366eb7e097ce7e361865c9fe6d14e1fcb795b9496cf92400fc"}}