{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:LRG5AOLD6PIPQ6IJYHJCTPPPHD","short_pith_number":"pith:LRG5AOLD","canonical_record":{"source":{"id":"1711.10133","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-11-28T05:43:44Z","cross_cats_sorted":[],"title_canon_sha256":"e4b5a48438f4205c061fa37763d0b95337d4aab991ea492b6a7098c2514004d0","abstract_canon_sha256":"9147757149edab6ccea6bdf2b20e296f82287b4077c656db0d50ef72a083544b"},"schema_version":"1.0"},"canonical_sha256":"5c4dd03963f3d0f87909c1d229bdef38c3aa9c02a8a779b8247508885152d027","source":{"kind":"arxiv","id":"1711.10133","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1711.10133","created_at":"2026-05-18T00:29:23Z"},{"alias_kind":"arxiv_version","alias_value":"1711.10133v1","created_at":"2026-05-18T00:29:23Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1711.10133","created_at":"2026-05-18T00:29:23Z"},{"alias_kind":"pith_short_12","alias_value":"LRG5AOLD6PIP","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_16","alias_value":"LRG5AOLD6PIPQ6IJ","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_8","alias_value":"LRG5AOLD","created_at":"2026-05-18T12:31:28Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:LRG5AOLD6PIPQ6IJYHJCTPPPHD","target":"record","payload":{"canonical_record":{"source":{"id":"1711.10133","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-11-28T05:43:44Z","cross_cats_sorted":[],"title_canon_sha256":"e4b5a48438f4205c061fa37763d0b95337d4aab991ea492b6a7098c2514004d0","abstract_canon_sha256":"9147757149edab6ccea6bdf2b20e296f82287b4077c656db0d50ef72a083544b"},"schema_version":"1.0"},"canonical_sha256":"5c4dd03963f3d0f87909c1d229bdef38c3aa9c02a8a779b8247508885152d027","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:29:23.293441Z","signature_b64":"5YuPipfm/uom8QatjsNWmbYwszj8kYBlTTcZxf+emMamQO0eCwfB3vT5RhzVDaDN0h3zhyBzrs7ComSBlK0oBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5c4dd03963f3d0f87909c1d229bdef38c3aa9c02a8a779b8247508885152d027","last_reissued_at":"2026-05-18T00:29:23.292662Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:29:23.292662Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1711.10133","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:29:23Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"qnCyVfsMAQCKww0HawCaJzYrqcp19yBl45BteSKuI/UcFuByl3ZTF/aTbPKupzKf/cY5Z39gDYdQm2FrNncjCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-22T16:04:40.848939Z"},"content_sha256":"a64f5339705a443a12c0b98c42d3dbb8179baa7b146395222e7b7329196bfb49","schema_version":"1.0","event_id":"sha256:a64f5339705a443a12c0b98c42d3dbb8179baa7b146395222e7b7329196bfb49"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:LRG5AOLD6PIPQ6IJYHJCTPPPHD","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Unsupervised Discovery of Structured Acoustic Tokens with Applications to Spoken Term Detection","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Cheng-Tao Chung, Lin-shan Lee","submitted_at":"2017-11-28T05:43:44Z","abstract_excerpt":"In this paper, we compare two paradigms for unsupervised discovery of structured acoustic tokens directly from speech corpora without any human annotation. The Multigranular Paradigm seeks to capture all available information in the corpora with multiple sets of tokens for different model granularities. The Hierarchical Paradigm attempts to jointly learn several levels of signal representations in a hierarchical structure. The two paradigms are unified within a theoretical framework in this paper. Query-by-Example Spoken Term Detection (QbE-STD) experiments on the QUESST dataset of MediaEval 2"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1711.10133","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:29:23Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ceZstDLnPxtTyh4qvV8ZBTUtKiY0IQsu5wbNjlx+clVJm3XRkLpvigUXx8pblpVC7ZiOTD4DugOWDuikmep6DQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-22T16:04:40.849288Z"},"content_sha256":"d5bf83d3c5234aed1bfed3171f8371e0fe2fa3107f05442972ddc5985286831d","schema_version":"1.0","event_id":"sha256:d5bf83d3c5234aed1bfed3171f8371e0fe2fa3107f05442972ddc5985286831d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/LRG5AOLD6PIPQ6IJYHJCTPPPHD/bundle.json","state_url":"https://pith.science/pith/LRG5AOLD6PIPQ6IJYHJCTPPPHD/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/LRG5AOLD6PIPQ6IJYHJCTPPPHD/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-22T16:04:40Z","links":{"resolver":"https://pith.science/pith/LRG5AOLD6PIPQ6IJYHJCTPPPHD","bundle":"https://pith.science/pith/LRG5AOLD6PIPQ6IJYHJCTPPPHD/bundle.json","state":"https://pith.science/pith/LRG5AOLD6PIPQ6IJYHJCTPPPHD/state.json","well_known_bundle":"https://pith.science/.well-known/pith/LRG5AOLD6PIPQ6IJYHJCTPPPHD/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:LRG5AOLD6PIPQ6IJYHJCTPPPHD","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"9147757149edab6ccea6bdf2b20e296f82287b4077c656db0d50ef72a083544b","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-11-28T05:43:44Z","title_canon_sha256":"e4b5a48438f4205c061fa37763d0b95337d4aab991ea492b6a7098c2514004d0"},"schema_version":"1.0","source":{"id":"1711.10133","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1711.10133","created_at":"2026-05-18T00:29:23Z"},{"alias_kind":"arxiv_version","alias_value":"1711.10133v1","created_at":"2026-05-18T00:29:23Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1711.10133","created_at":"2026-05-18T00:29:23Z"},{"alias_kind":"pith_short_12","alias_value":"LRG5AOLD6PIP","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_16","alias_value":"LRG5AOLD6PIPQ6IJ","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_8","alias_value":"LRG5AOLD","created_at":"2026-05-18T12:31:28Z"}],"graph_snapshots":[{"event_id":"sha256:d5bf83d3c5234aed1bfed3171f8371e0fe2fa3107f05442972ddc5985286831d","target":"graph","created_at":"2026-05-18T00:29:23Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In this paper, we compare two paradigms for unsupervised discovery of structured acoustic tokens directly from speech corpora without any human annotation. The Multigranular Paradigm seeks to capture all available information in the corpora with multiple sets of tokens for different model granularities. The Hierarchical Paradigm attempts to jointly learn several levels of signal representations in a hierarchical structure. The two paradigms are unified within a theoretical framework in this paper. Query-by-Example Spoken Term Detection (QbE-STD) experiments on the QUESST dataset of MediaEval 2","authors_text":"Cheng-Tao Chung, Lin-shan Lee","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-11-28T05:43:44Z","title":"Unsupervised Discovery of Structured Acoustic Tokens with Applications to Spoken Term Detection"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1711.10133","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a64f5339705a443a12c0b98c42d3dbb8179baa7b146395222e7b7329196bfb49","target":"record","created_at":"2026-05-18T00:29:23Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"9147757149edab6ccea6bdf2b20e296f82287b4077c656db0d50ef72a083544b","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-11-28T05:43:44Z","title_canon_sha256":"e4b5a48438f4205c061fa37763d0b95337d4aab991ea492b6a7098c2514004d0"},"schema_version":"1.0","source":{"id":"1711.10133","kind":"arxiv","version":1}},"canonical_sha256":"5c4dd03963f3d0f87909c1d229bdef38c3aa9c02a8a779b8247508885152d027","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5c4dd03963f3d0f87909c1d229bdef38c3aa9c02a8a779b8247508885152d027","first_computed_at":"2026-05-18T00:29:23.292662Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:29:23.292662Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"5YuPipfm/uom8QatjsNWmbYwszj8kYBlTTcZxf+emMamQO0eCwfB3vT5RhzVDaDN0h3zhyBzrs7ComSBlK0oBQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:29:23.293441Z","signed_message":"canonical_sha256_bytes"},"source_id":"1711.10133","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a64f5339705a443a12c0b98c42d3dbb8179baa7b146395222e7b7329196bfb49","sha256:d5bf83d3c5234aed1bfed3171f8371e0fe2fa3107f05442972ddc5985286831d"],"state_sha256":"ea48a19dee8d957a714418b9962b0ed639d5b224325095069fd6ccdb92441ba1"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Nxq2HFsFEKKmE0iQpPtSfk5KyGQ8SY33dhHdbQV3yb1dmKq+etTDJiYcnM5kfggQhpY2HAfmSjl8t8cwupkaAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-22T16:04:40.851224Z","bundle_sha256":"75cc6b53b053474c73365bae6b288583f248e5e1d82b179a5b933f6513b8b94a"}}