{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:5BG5CV5OU4WBHVSL3WUEXOEONE","short_pith_number":"pith:5BG5CV5O","canonical_record":{"source":{"id":"2606.28601","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.DB","submitted_at":"2026-06-26T20:49:46Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"e922dab1988087b32fa47508fa0544d92d4c03d5e3c4fcacf7e76fd85dc84e2e","abstract_canon_sha256":"37b686e75ed5828141a31bb9a0cb94b9ac2ad5915a740326d76c8858f900fb1a"},"schema_version":"1.0"},"canonical_sha256":"e84dd157aea72c13d64bdda84bb88e6908faecb887514ffc9a29e868f192327f","source":{"kind":"arxiv","id":"2606.28601","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.28601","created_at":"2026-06-30T00:15:20Z"},{"alias_kind":"arxiv_version","alias_value":"2606.28601v1","created_at":"2026-06-30T00:15:20Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.28601","created_at":"2026-06-30T00:15:20Z"},{"alias_kind":"pith_short_12","alias_value":"5BG5CV5OU4WB","created_at":"2026-06-30T00:15:20Z"},{"alias_kind":"pith_short_16","alias_value":"5BG5CV5OU4WBHVSL","created_at":"2026-06-30T00:15:20Z"},{"alias_kind":"pith_short_8","alias_value":"5BG5CV5O","created_at":"2026-06-30T00:15:20Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:5BG5CV5OU4WBHVSL3WUEXOEONE","target":"record","payload":{"canonical_record":{"source":{"id":"2606.28601","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.DB","submitted_at":"2026-06-26T20:49:46Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"e922dab1988087b32fa47508fa0544d92d4c03d5e3c4fcacf7e76fd85dc84e2e","abstract_canon_sha256":"37b686e75ed5828141a31bb9a0cb94b9ac2ad5915a740326d76c8858f900fb1a"},"schema_version":"1.0"},"canonical_sha256":"e84dd157aea72c13d64bdda84bb88e6908faecb887514ffc9a29e868f192327f","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-30T00:15:20.293073Z","signature_b64":"xqGx4VbP0uBzJ+vOcRSN2pcrACAqo2XW7IDAepkcsSKnm1Jy8o/PZP7TVeAkNxEumYYeq81kaxUlLQuO2cvtDg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e84dd157aea72c13d64bdda84bb88e6908faecb887514ffc9a29e868f192327f","last_reissued_at":"2026-06-30T00:15:20.292669Z","signature_status":"signed_v1","first_computed_at":"2026-06-30T00:15:20.292669Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.28601","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-30T00:15:20Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"IT017jLTky5fMhIWHzuFn2gC4zt4Xl6uiPAO7ANGz1NC85jhZwagD3VQWx3iHC6r5X+3wH+LodWMHJfqsbN/Aw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-03T06:12:54.625720Z"},"content_sha256":"71683f00ca2c280344e65274643bd67827101790e028b2b6a96e670e36f23eb9","schema_version":"1.0","event_id":"sha256:71683f00ca2c280344e65274643bd67827101790e028b2b6a96e670e36f23eb9"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:5BG5CV5OU4WBHVSL3WUEXOEONE","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Database Context Compression for Text-to-SQL on Real-World Large Databases","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.DB","authors_text":"Jingwen Liu, Junfeng Zhao, Weibin Liao, Xin Gao, Yasha Wang","submitted_at":"2026-06-26T20:49:46Z","abstract_excerpt":"Recent progress in Text-to-SQL has been driven by stronger language models and prompting strategies, yet performance on real enterprise benchmarks such as Spider 2.0 and BIRD remains far below that on classical academic datasets. We argue that the main bottleneck is no longer reasoning, but database representation. Real databases contain repeated audit columns, large groups of similar tables, opaque identifiers whose meanings are stored only in documentation, and extensive data dictionaries with little query-relevant information. Existing query-aware methods, including schema linking and retri"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.28601","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.28601/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-30T00:15:20Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6mvdNJOV+jAEyazkk1p3vSLs/vJ9YOkR9zkVaOc8JvsoC0Rxym0Xs4R8dR/NkWfb6FdEzcSlC3Mh+f3Ou3dbCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-03T06:12:54.626092Z"},"content_sha256":"5b58f33439bcf8be9dcd5b76cf3647daa266ee2fbd711251a0b6080768b4bc9f","schema_version":"1.0","event_id":"sha256:5b58f33439bcf8be9dcd5b76cf3647daa266ee2fbd711251a0b6080768b4bc9f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/5BG5CV5OU4WBHVSL3WUEXOEONE/bundle.json","state_url":"https://pith.science/pith/5BG5CV5OU4WBHVSL3WUEXOEONE/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/5BG5CV5OU4WBHVSL3WUEXOEONE/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-03T06:12:54Z","links":{"resolver":"https://pith.science/pith/5BG5CV5OU4WBHVSL3WUEXOEONE","bundle":"https://pith.science/pith/5BG5CV5OU4WBHVSL3WUEXOEONE/bundle.json","state":"https://pith.science/pith/5BG5CV5OU4WBHVSL3WUEXOEONE/state.json","well_known_bundle":"https://pith.science/.well-known/pith/5BG5CV5OU4WBHVSL3WUEXOEONE/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:5BG5CV5OU4WBHVSL3WUEXOEONE","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"37b686e75ed5828141a31bb9a0cb94b9ac2ad5915a740326d76c8858f900fb1a","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.DB","submitted_at":"2026-06-26T20:49:46Z","title_canon_sha256":"e922dab1988087b32fa47508fa0544d92d4c03d5e3c4fcacf7e76fd85dc84e2e"},"schema_version":"1.0","source":{"id":"2606.28601","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.28601","created_at":"2026-06-30T00:15:20Z"},{"alias_kind":"arxiv_version","alias_value":"2606.28601v1","created_at":"2026-06-30T00:15:20Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.28601","created_at":"2026-06-30T00:15:20Z"},{"alias_kind":"pith_short_12","alias_value":"5BG5CV5OU4WB","created_at":"2026-06-30T00:15:20Z"},{"alias_kind":"pith_short_16","alias_value":"5BG5CV5OU4WBHVSL","created_at":"2026-06-30T00:15:20Z"},{"alias_kind":"pith_short_8","alias_value":"5BG5CV5O","created_at":"2026-06-30T00:15:20Z"}],"graph_snapshots":[{"event_id":"sha256:5b58f33439bcf8be9dcd5b76cf3647daa266ee2fbd711251a0b6080768b4bc9f","target":"graph","created_at":"2026-06-30T00:15:20Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.28601/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Recent progress in Text-to-SQL has been driven by stronger language models and prompting strategies, yet performance on real enterprise benchmarks such as Spider 2.0 and BIRD remains far below that on classical academic datasets. We argue that the main bottleneck is no longer reasoning, but database representation. Real databases contain repeated audit columns, large groups of similar tables, opaque identifiers whose meanings are stored only in documentation, and extensive data dictionaries with little query-relevant information. Existing query-aware methods, including schema linking and retri","authors_text":"Jingwen Liu, Junfeng Zhao, Weibin Liao, Xin Gao, Yasha Wang","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.DB","submitted_at":"2026-06-26T20:49:46Z","title":"Database Context Compression for Text-to-SQL on Real-World Large Databases"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.28601","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:71683f00ca2c280344e65274643bd67827101790e028b2b6a96e670e36f23eb9","target":"record","created_at":"2026-06-30T00:15:20Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"37b686e75ed5828141a31bb9a0cb94b9ac2ad5915a740326d76c8858f900fb1a","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.DB","submitted_at":"2026-06-26T20:49:46Z","title_canon_sha256":"e922dab1988087b32fa47508fa0544d92d4c03d5e3c4fcacf7e76fd85dc84e2e"},"schema_version":"1.0","source":{"id":"2606.28601","kind":"arxiv","version":1}},"canonical_sha256":"e84dd157aea72c13d64bdda84bb88e6908faecb887514ffc9a29e868f192327f","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e84dd157aea72c13d64bdda84bb88e6908faecb887514ffc9a29e868f192327f","first_computed_at":"2026-06-30T00:15:20.292669Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-30T00:15:20.292669Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"xqGx4VbP0uBzJ+vOcRSN2pcrACAqo2XW7IDAepkcsSKnm1Jy8o/PZP7TVeAkNxEumYYeq81kaxUlLQuO2cvtDg==","signature_status":"signed_v1","signed_at":"2026-06-30T00:15:20.293073Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.28601","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:71683f00ca2c280344e65274643bd67827101790e028b2b6a96e670e36f23eb9","sha256:5b58f33439bcf8be9dcd5b76cf3647daa266ee2fbd711251a0b6080768b4bc9f"],"state_sha256":"7b263712d4783f0973d1a90e56aecf1db6cbfbff5de139623dd921b4e6f1a526"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ibik2hLEXfnSpAMl34Z1Ltdtqxv4TBrX9lbAuhFl0cpEMoMBXM0DjoRw8rJEeGc0wkgUmmAb91WXbIZ4a3u9Dg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-03T06:12:54.628045Z","bundle_sha256":"9dd8e4add7b0627ac555e4c67429822ca4616e446c80691e9339bc125716c1bc"}}