{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:QSMX2Y57YN4QLS3ESHTMTNHUL5","short_pith_number":"pith:QSMX2Y57","canonical_record":{"source":{"id":"1906.09890","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2019-06-24T12:44:09Z","cross_cats_sorted":["cs.LG","stat.ML"],"title_canon_sha256":"f403bed1c2735889cda01a30c5fd58b5f7c916c978a7f2bd8f710a593c8e1016","abstract_canon_sha256":"a411a5d583bfed4bc91e42134491d83a3cbd1c6ff340ee15f50ad352579d0910"},"schema_version":"1.0"},"canonical_sha256":"84997d63bfc37905cb6491e6c9b4f45f48a40719c79f9d5206b51acb6d8b7b8b","source":{"kind":"arxiv","id":"1906.09890","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1906.09890","created_at":"2026-05-17T23:41:41Z"},{"alias_kind":"arxiv_version","alias_value":"1906.09890v2","created_at":"2026-05-17T23:41:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1906.09890","created_at":"2026-05-17T23:41:41Z"},{"alias_kind":"pith_short_12","alias_value":"QSMX2Y57YN4Q","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_16","alias_value":"QSMX2Y57YN4QLS3E","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_8","alias_value":"QSMX2Y57","created_at":"2026-05-18T12:33:27Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:QSMX2Y57YN4QLS3ESHTMTNHUL5","target":"record","payload":{"canonical_record":{"source":{"id":"1906.09890","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2019-06-24T12:44:09Z","cross_cats_sorted":["cs.LG","stat.ML"],"title_canon_sha256":"f403bed1c2735889cda01a30c5fd58b5f7c916c978a7f2bd8f710a593c8e1016","abstract_canon_sha256":"a411a5d583bfed4bc91e42134491d83a3cbd1c6ff340ee15f50ad352579d0910"},"schema_version":"1.0"},"canonical_sha256":"84997d63bfc37905cb6491e6c9b4f45f48a40719c79f9d5206b51acb6d8b7b8b","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:41:41.712807Z","signature_b64":"taBuqKxoPpkByBI1urpZu5M28rTn1xDLn/moo7yrBcgSz/Ah+mo/CVc3TLSOgb0u+ZsiNQ3feTrNlOEzsi4YDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"84997d63bfc37905cb6491e6c9b4f45f48a40719c79f9d5206b51acb6d8b7b8b","last_reissued_at":"2026-05-17T23:41:41.712346Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:41:41.712346Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1906.09890","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"5n0r9vxxn33VK0yf9cmqCL0FSR9xBFWxcUy5pmMNCDCOXfYfdeqKvlpkSPYLYoC1VrCXQyFxU6SVuHcOafwdDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T12:34:12.138860Z"},"content_sha256":"34d53f7948bc6b2d774be2f366f4e4b2f813b487f55f5203f6d7ab0b4a542c04","schema_version":"1.0","event_id":"sha256:34d53f7948bc6b2d774be2f366f4e4b2f813b487f55f5203f6d7ab0b4a542c04"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:QSMX2Y57YN4QLS3ESHTMTNHUL5","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Self Multi-Head Attention for Speaker Recognition","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.LG","stat.ML"],"primary_cat":"cs.SD","authors_text":"Javier Hernando, Miquel India, Pooyan Safari","submitted_at":"2019-06-24T12:44:09Z","abstract_excerpt":"Most state-of-the-art Deep Learning (DL) approaches for speaker recognition work on a short utterance level. Given the speech signal, these algorithms extract a sequence of speaker embeddings from short segments and those are averaged to obtain an utterance level speaker representation. In this work we propose the use of an attention mechanism to obtain a discriminative speaker embedding given non fixed length speech utterances. Our system is based on a Convolutional Neural Network (CNN) that encodes short-term speaker features from the spectrogram and a self multi-head attention model that ma"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1906.09890","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"IvhP9Jnv6zhsvAON7ygEKrkiOPutimPKZ3gfA8exc4OqRzMIstX/zdiGnXM7mZj0Wzg43YKk59yMeVqy1Pb+AA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T12:34:12.139217Z"},"content_sha256":"e80e2d62642b3440f72e56132596311c586ebc47c5030dba0a961f1715c89456","schema_version":"1.0","event_id":"sha256:e80e2d62642b3440f72e56132596311c586ebc47c5030dba0a961f1715c89456"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/QSMX2Y57YN4QLS3ESHTMTNHUL5/bundle.json","state_url":"https://pith.science/pith/QSMX2Y57YN4QLS3ESHTMTNHUL5/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/QSMX2Y57YN4QLS3ESHTMTNHUL5/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T12:34:12Z","links":{"resolver":"https://pith.science/pith/QSMX2Y57YN4QLS3ESHTMTNHUL5","bundle":"https://pith.science/pith/QSMX2Y57YN4QLS3ESHTMTNHUL5/bundle.json","state":"https://pith.science/pith/QSMX2Y57YN4QLS3ESHTMTNHUL5/state.json","well_known_bundle":"https://pith.science/.well-known/pith/QSMX2Y57YN4QLS3ESHTMTNHUL5/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:QSMX2Y57YN4QLS3ESHTMTNHUL5","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a411a5d583bfed4bc91e42134491d83a3cbd1c6ff340ee15f50ad352579d0910","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2019-06-24T12:44:09Z","title_canon_sha256":"f403bed1c2735889cda01a30c5fd58b5f7c916c978a7f2bd8f710a593c8e1016"},"schema_version":"1.0","source":{"id":"1906.09890","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1906.09890","created_at":"2026-05-17T23:41:41Z"},{"alias_kind":"arxiv_version","alias_value":"1906.09890v2","created_at":"2026-05-17T23:41:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1906.09890","created_at":"2026-05-17T23:41:41Z"},{"alias_kind":"pith_short_12","alias_value":"QSMX2Y57YN4Q","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_16","alias_value":"QSMX2Y57YN4QLS3E","created_at":"2026-05-18T12:33:27Z"},{"alias_kind":"pith_short_8","alias_value":"QSMX2Y57","created_at":"2026-05-18T12:33:27Z"}],"graph_snapshots":[{"event_id":"sha256:e80e2d62642b3440f72e56132596311c586ebc47c5030dba0a961f1715c89456","target":"graph","created_at":"2026-05-17T23:41:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Most state-of-the-art Deep Learning (DL) approaches for speaker recognition work on a short utterance level. Given the speech signal, these algorithms extract a sequence of speaker embeddings from short segments and those are averaged to obtain an utterance level speaker representation. In this work we propose the use of an attention mechanism to obtain a discriminative speaker embedding given non fixed length speech utterances. Our system is based on a Convolutional Neural Network (CNN) that encodes short-term speaker features from the spectrogram and a self multi-head attention model that ma","authors_text":"Javier Hernando, Miquel India, Pooyan Safari","cross_cats":["cs.LG","stat.ML"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2019-06-24T12:44:09Z","title":"Self Multi-Head Attention for Speaker Recognition"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1906.09890","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:34d53f7948bc6b2d774be2f366f4e4b2f813b487f55f5203f6d7ab0b4a542c04","target":"record","created_at":"2026-05-17T23:41:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a411a5d583bfed4bc91e42134491d83a3cbd1c6ff340ee15f50ad352579d0910","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2019-06-24T12:44:09Z","title_canon_sha256":"f403bed1c2735889cda01a30c5fd58b5f7c916c978a7f2bd8f710a593c8e1016"},"schema_version":"1.0","source":{"id":"1906.09890","kind":"arxiv","version":2}},"canonical_sha256":"84997d63bfc37905cb6491e6c9b4f45f48a40719c79f9d5206b51acb6d8b7b8b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"84997d63bfc37905cb6491e6c9b4f45f48a40719c79f9d5206b51acb6d8b7b8b","first_computed_at":"2026-05-17T23:41:41.712346Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:41:41.712346Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"taBuqKxoPpkByBI1urpZu5M28rTn1xDLn/moo7yrBcgSz/Ah+mo/CVc3TLSOgb0u+ZsiNQ3feTrNlOEzsi4YDQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:41:41.712807Z","signed_message":"canonical_sha256_bytes"},"source_id":"1906.09890","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:34d53f7948bc6b2d774be2f366f4e4b2f813b487f55f5203f6d7ab0b4a542c04","sha256:e80e2d62642b3440f72e56132596311c586ebc47c5030dba0a961f1715c89456"],"state_sha256":"6ea672120b24ca1e904e945cfdc8501f97a57d1ab600be9967a3caff0655737a"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2n2oWBBZijWnLJSG3wQ4jaP1AXlNS1shJuPcsHS7ofRLM6tXQI7t9ePQY4Xp2TdKexnCsWlJg6Z8jtykg8JaBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T12:34:12.141612Z","bundle_sha256":"1869ced49654d44a227bf5e48512b231d8c66df25e70ea306987ed18985f24ad"}}