{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:IQ3HSRYAE244JRZX66G6PEE6R3","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"961675134f2d5e09ea582190744999ce0180bb556d221d524f3d9640438f60a0","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-01T15:54:13Z","title_canon_sha256":"0f0fd5be5b59a96182c01d9b7c60e094a1d914e8a63ca63deb5f34c2f72dc097"},"schema_version":"1.0","source":{"id":"2607.01237","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2607.01237","created_at":"2026-07-03T00:16:54Z"},{"alias_kind":"arxiv_version","alias_value":"2607.01237v1","created_at":"2026-07-03T00:16:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2607.01237","created_at":"2026-07-03T00:16:54Z"},{"alias_kind":"pith_short_12","alias_value":"IQ3HSRYAE244","created_at":"2026-07-03T00:16:54Z"},{"alias_kind":"pith_short_16","alias_value":"IQ3HSRYAE244JRZX","created_at":"2026-07-03T00:16:54Z"},{"alias_kind":"pith_short_8","alias_value":"IQ3HSRYA","created_at":"2026-07-03T00:16:54Z"}],"graph_snapshots":[{"event_id":"sha256:9c91ba65992efa0857ae44d8662e4ecb5db8f739e736b5deb06f7c7973ca5ac9","target":"graph","created_at":"2026-07-03T00:16:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2607.01237/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Reasoning language models often generate long chain-of-thought (CoT), which accumulates a massive KV cache during the decoding phase and incurs high decoding latency and limited throughput. To address these issues, KV cache compression has emerged as a promising technique for reducing memory overhead by selectively removing unimportant KV pairs while preserving useful ones for subsequent decoding. Nevertheless, we identify two key limitations in existing KV cache compression methods: 1) their threshold-triggered compression policy may provide limited throughput improvement or even reduce throu","authors_text":"Shen Han, Yuyang Wu","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-01T15:54:13Z","title":"Kara: Efficient Reasoning LLM Serving via Sliding-Window KV Cache Compression"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2607.01237","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:64e72e4d7434e9f48dd2255485e8eeb8eb5322816ecc33e2e98001306eb2bb71","target":"record","created_at":"2026-07-03T00:16:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"961675134f2d5e09ea582190744999ce0180bb556d221d524f3d9640438f60a0","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-01T15:54:13Z","title_canon_sha256":"0f0fd5be5b59a96182c01d9b7c60e094a1d914e8a63ca63deb5f34c2f72dc097"},"schema_version":"1.0","source":{"id":"2607.01237","kind":"arxiv","version":1}},"canonical_sha256":"443679470026b9c4c737f78de7909e8ee44da86a750c0a7c670f31b8987295cb","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"443679470026b9c4c737f78de7909e8ee44da86a750c0a7c670f31b8987295cb","first_computed_at":"2026-07-03T00:16:54.999621Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-03T00:16:54.999621Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"1taRrBGeDcV/b+JCFvBSgkU+EymjIiXZPfxleoR4VCm5+gw8enuFeD/kV7XUdvzeQPjhq1Mh5YEiLh3cg/rMDg==","signature_status":"signed_v1","signed_at":"2026-07-03T00:16:54.999982Z","signed_message":"canonical_sha256_bytes"},"source_id":"2607.01237","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:64e72e4d7434e9f48dd2255485e8eeb8eb5322816ecc33e2e98001306eb2bb71","sha256:9c91ba65992efa0857ae44d8662e4ecb5db8f739e736b5deb06f7c7973ca5ac9"],"state_sha256":"46af23c28deb36b9858b32001e31e4698953c92ac5e63b921fc3f518bbe1fed2"}