{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:443LYT3PP5D45LV2GO6WXEI5RD","short_pith_number":"pith:443LYT3P","canonical_record":{"source":{"id":"2606.08615","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-07T13:00:19Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"ee11f3b7a991e85a0c465338ecf4075e3dcace2213e1f86c031581d5f28b56d0","abstract_canon_sha256":"57e607be7398b513c69ec9a6cd880f30ebba14f7f78353c04c774cb914857996"},"schema_version":"1.0"},"canonical_sha256":"e736bc4f6f7f47ceaeba33bd6b911d88f4bad3a1cdbf073245854f93762c9ebe","source":{"kind":"arxiv","id":"2606.08615","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.08615","created_at":"2026-06-09T01:05:41Z"},{"alias_kind":"arxiv_version","alias_value":"2606.08615v1","created_at":"2026-06-09T01:05:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.08615","created_at":"2026-06-09T01:05:41Z"},{"alias_kind":"pith_short_12","alias_value":"443LYT3PP5D4","created_at":"2026-06-09T01:05:41Z"},{"alias_kind":"pith_short_16","alias_value":"443LYT3PP5D45LV2","created_at":"2026-06-09T01:05:41Z"},{"alias_kind":"pith_short_8","alias_value":"443LYT3P","created_at":"2026-06-09T01:05:41Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:443LYT3PP5D45LV2GO6WXEI5RD","target":"record","payload":{"canonical_record":{"source":{"id":"2606.08615","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-07T13:00:19Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"ee11f3b7a991e85a0c465338ecf4075e3dcace2213e1f86c031581d5f28b56d0","abstract_canon_sha256":"57e607be7398b513c69ec9a6cd880f30ebba14f7f78353c04c774cb914857996"},"schema_version":"1.0"},"canonical_sha256":"e736bc4f6f7f47ceaeba33bd6b911d88f4bad3a1cdbf073245854f93762c9ebe","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-09T01:05:41.566098Z","signature_b64":"44soJov04yLzBenEcKQTXJyJlU42yo09b0z6ATrQEZsiBghxjYK1KIMZH1rb6CQfw4MGP3GzQ1HuDdZKaioSAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e736bc4f6f7f47ceaeba33bd6b911d88f4bad3a1cdbf073245854f93762c9ebe","last_reissued_at":"2026-06-09T01:05:41.565628Z","signature_status":"signed_v1","first_computed_at":"2026-06-09T01:05:41.565628Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.08615","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-09T01:05:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"oI+oJbzbcim9GeaFQF8uQzIuhSzk7lK+9Ymukf5ueQF3X/lgmLrLAxJby/inoXSVjuRi14TqlrTrb19xB3ZUBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T10:58:56.434269Z"},"content_sha256":"30c3a65748d503534d21b4090a631bc185e2984841de28338b49523386b7a68d","schema_version":"1.0","event_id":"sha256:30c3a65748d503534d21b4090a631bc185e2984841de28338b49523386b7a68d"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:443LYT3PP5D45LV2GO6WXEI5RD","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Harnessing Streaming Video in the Wild","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.CL"],"primary_cat":"cs.CV","authors_text":"Chenxu Yang, Chuanyu Qin, Dingyu Yao, Jiaqi Wang, Junhao Zhou, Naibin Gu, Nan Duan, Qingyi Si, Shuhuan Gu, Weiping Wang, Zheng Lin","submitted_at":"2026-06-07T13:00:19Z","abstract_excerpt":"Vision-Language Models (VLMs) are increasingly required to process unbounded video streams in applications such as video-call assistants, live commentary, and embodied robots. An ideal streaming system should support proactive interaction, long-horizon memory, and real-time processing, while resting on a VLM backbone capable of handling diverse in-the-wild streaming tasks. However, existing VLMs excel at offline video understanding but fall short in streaming capabilities and lack dedicated infrastructure for streaming deployment. We address this gap on three fronts. (i) For backbone capabilit"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.08615","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.08615/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-09T01:05:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Tlx3Bs1MrE5flJGfkQ0QwzAMZFhn7vCX7KXN4+5NqxfrSiUJM/NZWdZa6Luj3GqljnOhObXWA9AX6oRCrDbVAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T10:58:56.434641Z"},"content_sha256":"c9a89bb9e681595e4ef66b7b83961a6dc384e76d42c97b7d9b197e5880ac0f53","schema_version":"1.0","event_id":"sha256:c9a89bb9e681595e4ef66b7b83961a6dc384e76d42c97b7d9b197e5880ac0f53"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/443LYT3PP5D45LV2GO6WXEI5RD/bundle.json","state_url":"https://pith.science/pith/443LYT3PP5D45LV2GO6WXEI5RD/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/443LYT3PP5D45LV2GO6WXEI5RD/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-28T10:58:56Z","links":{"resolver":"https://pith.science/pith/443LYT3PP5D45LV2GO6WXEI5RD","bundle":"https://pith.science/pith/443LYT3PP5D45LV2GO6WXEI5RD/bundle.json","state":"https://pith.science/pith/443LYT3PP5D45LV2GO6WXEI5RD/state.json","well_known_bundle":"https://pith.science/.well-known/pith/443LYT3PP5D45LV2GO6WXEI5RD/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:443LYT3PP5D45LV2GO6WXEI5RD","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"57e607be7398b513c69ec9a6cd880f30ebba14f7f78353c04c774cb914857996","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-07T13:00:19Z","title_canon_sha256":"ee11f3b7a991e85a0c465338ecf4075e3dcace2213e1f86c031581d5f28b56d0"},"schema_version":"1.0","source":{"id":"2606.08615","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.08615","created_at":"2026-06-09T01:05:41Z"},{"alias_kind":"arxiv_version","alias_value":"2606.08615v1","created_at":"2026-06-09T01:05:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.08615","created_at":"2026-06-09T01:05:41Z"},{"alias_kind":"pith_short_12","alias_value":"443LYT3PP5D4","created_at":"2026-06-09T01:05:41Z"},{"alias_kind":"pith_short_16","alias_value":"443LYT3PP5D45LV2","created_at":"2026-06-09T01:05:41Z"},{"alias_kind":"pith_short_8","alias_value":"443LYT3P","created_at":"2026-06-09T01:05:41Z"}],"graph_snapshots":[{"event_id":"sha256:c9a89bb9e681595e4ef66b7b83961a6dc384e76d42c97b7d9b197e5880ac0f53","target":"graph","created_at":"2026-06-09T01:05:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.08615/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Vision-Language Models (VLMs) are increasingly required to process unbounded video streams in applications such as video-call assistants, live commentary, and embodied robots. An ideal streaming system should support proactive interaction, long-horizon memory, and real-time processing, while resting on a VLM backbone capable of handling diverse in-the-wild streaming tasks. However, existing VLMs excel at offline video understanding but fall short in streaming capabilities and lack dedicated infrastructure for streaming deployment. We address this gap on three fronts. (i) For backbone capabilit","authors_text":"Chenxu Yang, Chuanyu Qin, Dingyu Yao, Jiaqi Wang, Junhao Zhou, Naibin Gu, Nan Duan, Qingyi Si, Shuhuan Gu, Weiping Wang, Zheng Lin","cross_cats":["cs.CL"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-07T13:00:19Z","title":"Harnessing Streaming Video in the Wild"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.08615","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:30c3a65748d503534d21b4090a631bc185e2984841de28338b49523386b7a68d","target":"record","created_at":"2026-06-09T01:05:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"57e607be7398b513c69ec9a6cd880f30ebba14f7f78353c04c774cb914857996","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-07T13:00:19Z","title_canon_sha256":"ee11f3b7a991e85a0c465338ecf4075e3dcace2213e1f86c031581d5f28b56d0"},"schema_version":"1.0","source":{"id":"2606.08615","kind":"arxiv","version":1}},"canonical_sha256":"e736bc4f6f7f47ceaeba33bd6b911d88f4bad3a1cdbf073245854f93762c9ebe","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e736bc4f6f7f47ceaeba33bd6b911d88f4bad3a1cdbf073245854f93762c9ebe","first_computed_at":"2026-06-09T01:05:41.565628Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-09T01:05:41.565628Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"44soJov04yLzBenEcKQTXJyJlU42yo09b0z6ATrQEZsiBghxjYK1KIMZH1rb6CQfw4MGP3GzQ1HuDdZKaioSAg==","signature_status":"signed_v1","signed_at":"2026-06-09T01:05:41.566098Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.08615","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:30c3a65748d503534d21b4090a631bc185e2984841de28338b49523386b7a68d","sha256:c9a89bb9e681595e4ef66b7b83961a6dc384e76d42c97b7d9b197e5880ac0f53"],"state_sha256":"c8b5e3cf398c53e1b0c1f8b71e22b752effbd7bd42aebef9b0c2410b4ec48ef8"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZZFTECVV3c7VTnqaEJDGW7/yJ5+GuJ1gjNj+ZnVslF1m/3NZCA7M3397hL4u/8M1YqFK6iivnDzHkAkW1TWPCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-28T10:58:56.436647Z","bundle_sha256":"3dc0c3f1dd54b6a386c04803db35210db3c8bbbdc8595005c9efa5e24740d389"}}