{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:XZMN76TQOO2UNVIMLR2P3RGZG5","short_pith_number":"pith:XZMN76TQ","canonical_record":{"source":{"id":"2606.05568","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.IR","submitted_at":"2026-06-04T01:28:45Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"3154cb489dffd91a0ee05aff36c23811fa2d8d3f5338ecf60318a9822f2f6045","abstract_canon_sha256":"5f7e4f42fd726ff393b7989b72ad39d248a5501a4f31474a480aa61377f6c1b7"},"schema_version":"1.0"},"canonical_sha256":"be58dffa7073b546d50c5c74fdc4d937550a74081810d38d8be689ea4cd283f7","source":{"kind":"arxiv","id":"2606.05568","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.05568","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"arxiv_version","alias_value":"2606.05568v1","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.05568","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"pith_short_12","alias_value":"XZMN76TQOO2U","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"pith_short_16","alias_value":"XZMN76TQOO2UNVIM","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"pith_short_8","alias_value":"XZMN76TQ","created_at":"2026-06-05T01:14:55Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:XZMN76TQOO2UNVIMLR2P3RGZG5","target":"record","payload":{"canonical_record":{"source":{"id":"2606.05568","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.IR","submitted_at":"2026-06-04T01:28:45Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"3154cb489dffd91a0ee05aff36c23811fa2d8d3f5338ecf60318a9822f2f6045","abstract_canon_sha256":"5f7e4f42fd726ff393b7989b72ad39d248a5501a4f31474a480aa61377f6c1b7"},"schema_version":"1.0"},"canonical_sha256":"be58dffa7073b546d50c5c74fdc4d937550a74081810d38d8be689ea4cd283f7","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-05T01:14:55.140887Z","signature_b64":"P3eDlk67ZKQUtCBaOt0INf3BTV/Z5oXocZSF+SkX3LLIrX5OoIh0JZFCjzkn/weWjJE4wlzBBoNHc6IYL2tdDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"be58dffa7073b546d50c5c74fdc4d937550a74081810d38d8be689ea4cd283f7","last_reissued_at":"2026-06-05T01:14:55.140453Z","signature_status":"signed_v1","first_computed_at":"2026-06-05T01:14:55.140453Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.05568","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-05T01:14:55Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"QwRvt+sk/0GobMRd+5HfPbdkNuJ/KhzL7nuTRSCgBFqK9fV89gCu2MXLz/y97fAav5I7uzTXga/A5f8X8mZbCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T16:18:09.880424Z"},"content_sha256":"f4c9235283a9ec4da3fc5f886a8a403766777875d74f4b8936f9c7f27418599e","schema_version":"1.0","event_id":"sha256:f4c9235283a9ec4da3fc5f886a8a403766777875d74f4b8936f9c7f27418599e"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:XZMN76TQOO2UNVIMLR2P3RGZG5","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"ColBERTSaR: Sparsified ColBERT Index via Product Quantization","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.CL"],"primary_cat":"cs.IR","authors_text":"Andrew Yates, Dawn Lawrie, Eugene Yang, James Mayfield, Rohan Jha, Saron Samuel","submitted_at":"2026-06-04T01:28:45Z","abstract_excerpt":"While ColBERT is an effective neural retrieval architecture, it requires a heavy index structure to support candidate set retrieval based on approximated token embeddings, gathering and decompressing document token embeddings, and applying the MaxSim operation. Indexes in PLAID and similar ColBERT implementations require five to ten times the disk storage of the original raw text, which limits their scalability. Furthermore, prior work has identified that the gathering and decompression stages are the primary inefficiencies at query time. Limiting the number of document tokens that must be gat"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.05568","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.05568/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-05T01:14:55Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"fE3ZZrX+m+nCUjjQpedgPXVJ7gPMopfcJZ6lEJe1GjBJVAFJXk4BXLUAy37QnWFJsuAPEk0DuxDh5lgwmVuuCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T16:18:09.881217Z"},"content_sha256":"99d203c9f3005f1290f2b1232317495fa3daa510dfcf8c9eb88920402fdbb865","schema_version":"1.0","event_id":"sha256:99d203c9f3005f1290f2b1232317495fa3daa510dfcf8c9eb88920402fdbb865"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/XZMN76TQOO2UNVIMLR2P3RGZG5/bundle.json","state_url":"https://pith.science/pith/XZMN76TQOO2UNVIMLR2P3RGZG5/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/XZMN76TQOO2UNVIMLR2P3RGZG5/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-07T16:18:09Z","links":{"resolver":"https://pith.science/pith/XZMN76TQOO2UNVIMLR2P3RGZG5","bundle":"https://pith.science/pith/XZMN76TQOO2UNVIMLR2P3RGZG5/bundle.json","state":"https://pith.science/pith/XZMN76TQOO2UNVIMLR2P3RGZG5/state.json","well_known_bundle":"https://pith.science/.well-known/pith/XZMN76TQOO2UNVIMLR2P3RGZG5/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:XZMN76TQOO2UNVIMLR2P3RGZG5","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5f7e4f42fd726ff393b7989b72ad39d248a5501a4f31474a480aa61377f6c1b7","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.IR","submitted_at":"2026-06-04T01:28:45Z","title_canon_sha256":"3154cb489dffd91a0ee05aff36c23811fa2d8d3f5338ecf60318a9822f2f6045"},"schema_version":"1.0","source":{"id":"2606.05568","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.05568","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"arxiv_version","alias_value":"2606.05568v1","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.05568","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"pith_short_12","alias_value":"XZMN76TQOO2U","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"pith_short_16","alias_value":"XZMN76TQOO2UNVIM","created_at":"2026-06-05T01:14:55Z"},{"alias_kind":"pith_short_8","alias_value":"XZMN76TQ","created_at":"2026-06-05T01:14:55Z"}],"graph_snapshots":[{"event_id":"sha256:99d203c9f3005f1290f2b1232317495fa3daa510dfcf8c9eb88920402fdbb865","target":"graph","created_at":"2026-06-05T01:14:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.05568/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"While ColBERT is an effective neural retrieval architecture, it requires a heavy index structure to support candidate set retrieval based on approximated token embeddings, gathering and decompressing document token embeddings, and applying the MaxSim operation. Indexes in PLAID and similar ColBERT implementations require five to ten times the disk storage of the original raw text, which limits their scalability. Furthermore, prior work has identified that the gathering and decompression stages are the primary inefficiencies at query time. Limiting the number of document tokens that must be gat","authors_text":"Andrew Yates, Dawn Lawrie, Eugene Yang, James Mayfield, Rohan Jha, Saron Samuel","cross_cats":["cs.CL"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.IR","submitted_at":"2026-06-04T01:28:45Z","title":"ColBERTSaR: Sparsified ColBERT Index via Product Quantization"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.05568","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:f4c9235283a9ec4da3fc5f886a8a403766777875d74f4b8936f9c7f27418599e","target":"record","created_at":"2026-06-05T01:14:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5f7e4f42fd726ff393b7989b72ad39d248a5501a4f31474a480aa61377f6c1b7","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.IR","submitted_at":"2026-06-04T01:28:45Z","title_canon_sha256":"3154cb489dffd91a0ee05aff36c23811fa2d8d3f5338ecf60318a9822f2f6045"},"schema_version":"1.0","source":{"id":"2606.05568","kind":"arxiv","version":1}},"canonical_sha256":"be58dffa7073b546d50c5c74fdc4d937550a74081810d38d8be689ea4cd283f7","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"be58dffa7073b546d50c5c74fdc4d937550a74081810d38d8be689ea4cd283f7","first_computed_at":"2026-06-05T01:14:55.140453Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-05T01:14:55.140453Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"P3eDlk67ZKQUtCBaOt0INf3BTV/Z5oXocZSF+SkX3LLIrX5OoIh0JZFCjzkn/weWjJE4wlzBBoNHc6IYL2tdDA==","signature_status":"signed_v1","signed_at":"2026-06-05T01:14:55.140887Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.05568","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:f4c9235283a9ec4da3fc5f886a8a403766777875d74f4b8936f9c7f27418599e","sha256:99d203c9f3005f1290f2b1232317495fa3daa510dfcf8c9eb88920402fdbb865"],"state_sha256":"61fefa616d2a971a1d67f7d4a02248c8366e434c3fd1ed079c00647aa8e04667"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"vAv7yoLUCftDSQWhv45X6M2/Dn7majbYzIjgG38R98zXBfnIlGH4CMXeC+RFp1La6ca5q7gk2ACYX9hArDeZCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-07T16:18:09.885014Z","bundle_sha256":"46c3459d7da58316d7e1b74649c2544b9657f8b0d0d8bc139580c23900a87788"}}