{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:CUO2QMQVV5R3TTVXUJFHHDCFD6","short_pith_number":"pith:CUO2QMQV","canonical_record":{"source":{"id":"2606.24477","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-23T12:13:19Z","cross_cats_sorted":["cs.AI","cs.SD"],"title_canon_sha256":"0bad93b7475fbfc6d7f9e4db852e1c9068b53fad117fde9b2167bb8e92ae9bf4","abstract_canon_sha256":"909bc94edbf522cbf71f28967e4f352c077fae09985ef58f6c72c5af1ca4edc0"},"schema_version":"1.0"},"canonical_sha256":"151da83215af63b9ceb7a24a738c451fb445bdf916bb873da8cc78a2d58e2b25","source":{"kind":"arxiv","id":"2606.24477","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.24477","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"arxiv_version","alias_value":"2606.24477v1","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.24477","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"pith_short_12","alias_value":"CUO2QMQVV5R3","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"pith_short_16","alias_value":"CUO2QMQVV5R3TTVX","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"pith_short_8","alias_value":"CUO2QMQV","created_at":"2026-06-24T01:15:31Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:CUO2QMQVV5R3TTVXUJFHHDCFD6","target":"record","payload":{"canonical_record":{"source":{"id":"2606.24477","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-23T12:13:19Z","cross_cats_sorted":["cs.AI","cs.SD"],"title_canon_sha256":"0bad93b7475fbfc6d7f9e4db852e1c9068b53fad117fde9b2167bb8e92ae9bf4","abstract_canon_sha256":"909bc94edbf522cbf71f28967e4f352c077fae09985ef58f6c72c5af1ca4edc0"},"schema_version":"1.0"},"canonical_sha256":"151da83215af63b9ceb7a24a738c451fb445bdf916bb873da8cc78a2d58e2b25","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-24T01:15:31.608053Z","signature_b64":"oON0NyKW+4iGwW971RX5Z3+ySDtz+jV4zQfKkBo3xtg7E+9NQ7LIQSQoYw4h4OrTDRRZTuTIhIWNy+B7JfhGAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"151da83215af63b9ceb7a24a738c451fb445bdf916bb873da8cc78a2d58e2b25","last_reissued_at":"2026-06-24T01:15:31.607660Z","signature_status":"signed_v1","first_computed_at":"2026-06-24T01:15:31.607660Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.24477","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-24T01:15:31Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/0/X3RKn+ZDph8/ziXjPJGVfB3/2kk2fkWiiwHpAssfK6bm7LBXOloDktUrK2YZqRqvddLWjZiXc5ac53lNlBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-27T17:12:53.570605Z"},"content_sha256":"e387f2ab2c63ac48f6c718762d5e0e4d16cea6064f3a75c9ca9e4df6c63da36e","schema_version":"1.0","event_id":"sha256:e387f2ab2c63ac48f6c718762d5e0e4d16cea6064f3a75c9ca9e4df6c63da36e"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:CUO2QMQVV5R3TTVXUJFHHDCFD6","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"video-SALMONN-R$^3$: Learning to ReWatch, ReAsk, and ReAnswer for Efficient Video Understanding","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.SD"],"primary_cat":"cs.CV","authors_text":"Chao Zhang, Guangzhi Sun, Wei Li, Yixuan Li, Yudong Yang, Zejun Ma","submitted_at":"2026-06-23T12:13:19Z","abstract_excerpt":"Video large language models (LLMs) are often constrained by computation and memory budgets, leading them to use reduced frame rates and spatial resolutions, which may cause them to miss critical information for question answering (QA). A practical and efficient solution is a two-stage paradigm: first perform coarse video understanding to localize relevant segments, and then re-watch these segments at higher temporal or spatial fidelity. In this paper, we present video-SALMONN-R$^3$, the first end-to-end video-LLM that enables re-watch through reinforcement learning without relying on chain-of-"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.24477","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.24477/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-24T01:15:31Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CueoFLc83Fruwi/VDDl7YRWNYANRpN21cnb+4QKbwDohhQ6DqekIBbVq1nIAwUUzO3Vkt/OSqiPcR77cQaTpAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-27T17:12:53.570979Z"},"content_sha256":"8445e84818b57a3ccca505d2217ff76b8f8376f6664f9590c8e6c0f26b1726c6","schema_version":"1.0","event_id":"sha256:8445e84818b57a3ccca505d2217ff76b8f8376f6664f9590c8e6c0f26b1726c6"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/CUO2QMQVV5R3TTVXUJFHHDCFD6/bundle.json","state_url":"https://pith.science/pith/CUO2QMQVV5R3TTVXUJFHHDCFD6/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/CUO2QMQVV5R3TTVXUJFHHDCFD6/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-27T17:12:53Z","links":{"resolver":"https://pith.science/pith/CUO2QMQVV5R3TTVXUJFHHDCFD6","bundle":"https://pith.science/pith/CUO2QMQVV5R3TTVXUJFHHDCFD6/bundle.json","state":"https://pith.science/pith/CUO2QMQVV5R3TTVXUJFHHDCFD6/state.json","well_known_bundle":"https://pith.science/.well-known/pith/CUO2QMQVV5R3TTVXUJFHHDCFD6/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:CUO2QMQVV5R3TTVXUJFHHDCFD6","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"909bc94edbf522cbf71f28967e4f352c077fae09985ef58f6c72c5af1ca4edc0","cross_cats_sorted":["cs.AI","cs.SD"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-23T12:13:19Z","title_canon_sha256":"0bad93b7475fbfc6d7f9e4db852e1c9068b53fad117fde9b2167bb8e92ae9bf4"},"schema_version":"1.0","source":{"id":"2606.24477","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.24477","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"arxiv_version","alias_value":"2606.24477v1","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.24477","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"pith_short_12","alias_value":"CUO2QMQVV5R3","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"pith_short_16","alias_value":"CUO2QMQVV5R3TTVX","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"pith_short_8","alias_value":"CUO2QMQV","created_at":"2026-06-24T01:15:31Z"}],"graph_snapshots":[{"event_id":"sha256:8445e84818b57a3ccca505d2217ff76b8f8376f6664f9590c8e6c0f26b1726c6","target":"graph","created_at":"2026-06-24T01:15:31Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.24477/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Video large language models (LLMs) are often constrained by computation and memory budgets, leading them to use reduced frame rates and spatial resolutions, which may cause them to miss critical information for question answering (QA). A practical and efficient solution is a two-stage paradigm: first perform coarse video understanding to localize relevant segments, and then re-watch these segments at higher temporal or spatial fidelity. In this paper, we present video-SALMONN-R$^3$, the first end-to-end video-LLM that enables re-watch through reinforcement learning without relying on chain-of-","authors_text":"Chao Zhang, Guangzhi Sun, Wei Li, Yixuan Li, Yudong Yang, Zejun Ma","cross_cats":["cs.AI","cs.SD"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-23T12:13:19Z","title":"video-SALMONN-R$^3$: Learning to ReWatch, ReAsk, and ReAnswer for Efficient Video Understanding"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.24477","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:e387f2ab2c63ac48f6c718762d5e0e4d16cea6064f3a75c9ca9e4df6c63da36e","target":"record","created_at":"2026-06-24T01:15:31Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"909bc94edbf522cbf71f28967e4f352c077fae09985ef58f6c72c5af1ca4edc0","cross_cats_sorted":["cs.AI","cs.SD"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-23T12:13:19Z","title_canon_sha256":"0bad93b7475fbfc6d7f9e4db852e1c9068b53fad117fde9b2167bb8e92ae9bf4"},"schema_version":"1.0","source":{"id":"2606.24477","kind":"arxiv","version":1}},"canonical_sha256":"151da83215af63b9ceb7a24a738c451fb445bdf916bb873da8cc78a2d58e2b25","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"151da83215af63b9ceb7a24a738c451fb445bdf916bb873da8cc78a2d58e2b25","first_computed_at":"2026-06-24T01:15:31.607660Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-24T01:15:31.607660Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"oON0NyKW+4iGwW971RX5Z3+ySDtz+jV4zQfKkBo3xtg7E+9NQ7LIQSQoYw4h4OrTDRRZTuTIhIWNy+B7JfhGAw==","signature_status":"signed_v1","signed_at":"2026-06-24T01:15:31.608053Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.24477","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:e387f2ab2c63ac48f6c718762d5e0e4d16cea6064f3a75c9ca9e4df6c63da36e","sha256:8445e84818b57a3ccca505d2217ff76b8f8376f6664f9590c8e6c0f26b1726c6"],"state_sha256":"230b7eae26715be4485a1c9127c580a83566eb5c2e7b0a9d7732d8066de50326"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2Fmk9cH6Afyp+WgBhaZ6dzURp9SBUpCtDMru2pUkO413O4K2ezecbV6kKXqq25G9eUG3OZS+x7nbiNfhsD0jBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-27T17:12:53.572905Z","bundle_sha256":"7d80850eb037149276321e342ce29cc99cc8275d4e65e39853342e610cf088ec"}}