{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:5RAOA7QQI4MQUYSWCUMT4QR73B","short_pith_number":"pith:5RAOA7QQ","canonical_record":{"source":{"id":"2606.27313","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-25T17:29:27Z","cross_cats_sorted":[],"title_canon_sha256":"ad85854e54d2aebbdb00288996714be6be89e9626c559af97addb0617b3c49a3","abstract_canon_sha256":"e6ad607eb650bba1e649d017513e2633b4ace74720f048589fed7187ac35c024"},"schema_version":"1.0"},"canonical_sha256":"ec40e07e1047190a625615193e423fd8729e5358fd7f5ef177b28b1644831229","source":{"kind":"arxiv","id":"2606.27313","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.27313","created_at":"2026-06-26T01:16:18Z"},{"alias_kind":"arxiv_version","alias_value":"2606.27313v1","created_at":"2026-06-26T01:16:18Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.27313","created_at":"2026-06-26T01:16:18Z"},{"alias_kind":"pith_short_12","alias_value":"5RAOA7QQI4MQ","created_at":"2026-06-26T01:16:18Z"},{"alias_kind":"pith_short_16","alias_value":"5RAOA7QQI4MQUYSW","created_at":"2026-06-26T01:16:18Z"},{"alias_kind":"pith_short_8","alias_value":"5RAOA7QQ","created_at":"2026-06-26T01:16:18Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:5RAOA7QQI4MQUYSWCUMT4QR73B","target":"record","payload":{"canonical_record":{"source":{"id":"2606.27313","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-25T17:29:27Z","cross_cats_sorted":[],"title_canon_sha256":"ad85854e54d2aebbdb00288996714be6be89e9626c559af97addb0617b3c49a3","abstract_canon_sha256":"e6ad607eb650bba1e649d017513e2633b4ace74720f048589fed7187ac35c024"},"schema_version":"1.0"},"canonical_sha256":"ec40e07e1047190a625615193e423fd8729e5358fd7f5ef177b28b1644831229","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-26T01:16:18.433968Z","signature_b64":"rOYPxkO38oN0L8Dw87HqPKirE13RCrjk5dxt/bL88G4NQwiQfLVmrI2hutMAnGsaLTsgspyauGb8KSw0EGf8CA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"ec40e07e1047190a625615193e423fd8729e5358fd7f5ef177b28b1644831229","last_reissued_at":"2026-06-26T01:16:18.433570Z","signature_status":"signed_v1","first_computed_at":"2026-06-26T01:16:18.433570Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.27313","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-26T01:16:18Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ueswVI3pXtouCAF/gpjrG1rHPeROs5KI/qgtE4pGt/Jhw4xTgMF1EAOu9fs8YQlR3KG75VwzYLMjFbny785eCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-01T16:42:25.387378Z"},"content_sha256":"a59a5597f6ecedbf1038c28a9e65b8f05f42da94eb4359a46d87662dac43aa63","schema_version":"1.0","event_id":"sha256:a59a5597f6ecedbf1038c28a9e65b8f05f42da94eb4359a46d87662dac43aa63"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:5RAOA7QQI4MQUYSWCUMT4QR73B","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"ViQ: Text-Aligned Visual Quantized Representations at Any Resolution","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Han Hu, Jiwen Lu, Shengsheng Qian, Xumin Yu, Yongming Rao, Yuhao Dong, Zhenyu Yang, Zuyan Liu","submitted_at":"2026-06-25T17:29:27Z","abstract_excerpt":"A unified representation for text and vision is a natural pursuit, as it enables simpler multimodal modeling and more efficient training. However, representing images as discrete signals in the same way as text inevitably introduces severe information loss. Existing work struggles to balance low-level details and high-level semantics in discrete representations: reconstruction-oriented representations often lack semantic information, whereas semantically stronger features typically suffer from severe loss of detail. We present ViQ, a Visual Quantized Representations framework, which is designe"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.27313","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.27313/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-26T01:16:18Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6z+O+ASDoy+V0JSs9U1osvT5elATCw1+hBLvLyNra/QCOlqLqlvA+0cJ4UnYsnyUWHuVDl80k5s1UaaO7UiiCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-01T16:42:25.387758Z"},"content_sha256":"02a5b659f85af05bca3bc5b72de98c3428989881b18a35ead738571ee1538ef6","schema_version":"1.0","event_id":"sha256:02a5b659f85af05bca3bc5b72de98c3428989881b18a35ead738571ee1538ef6"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/5RAOA7QQI4MQUYSWCUMT4QR73B/bundle.json","state_url":"https://pith.science/pith/5RAOA7QQI4MQUYSWCUMT4QR73B/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/5RAOA7QQI4MQUYSWCUMT4QR73B/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-01T16:42:25Z","links":{"resolver":"https://pith.science/pith/5RAOA7QQI4MQUYSWCUMT4QR73B","bundle":"https://pith.science/pith/5RAOA7QQI4MQUYSWCUMT4QR73B/bundle.json","state":"https://pith.science/pith/5RAOA7QQI4MQUYSWCUMT4QR73B/state.json","well_known_bundle":"https://pith.science/.well-known/pith/5RAOA7QQI4MQUYSWCUMT4QR73B/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:5RAOA7QQI4MQUYSWCUMT4QR73B","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e6ad607eb650bba1e649d017513e2633b4ace74720f048589fed7187ac35c024","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-25T17:29:27Z","title_canon_sha256":"ad85854e54d2aebbdb00288996714be6be89e9626c559af97addb0617b3c49a3"},"schema_version":"1.0","source":{"id":"2606.27313","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.27313","created_at":"2026-06-26T01:16:18Z"},{"alias_kind":"arxiv_version","alias_value":"2606.27313v1","created_at":"2026-06-26T01:16:18Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.27313","created_at":"2026-06-26T01:16:18Z"},{"alias_kind":"pith_short_12","alias_value":"5RAOA7QQI4MQ","created_at":"2026-06-26T01:16:18Z"},{"alias_kind":"pith_short_16","alias_value":"5RAOA7QQI4MQUYSW","created_at":"2026-06-26T01:16:18Z"},{"alias_kind":"pith_short_8","alias_value":"5RAOA7QQ","created_at":"2026-06-26T01:16:18Z"}],"graph_snapshots":[{"event_id":"sha256:02a5b659f85af05bca3bc5b72de98c3428989881b18a35ead738571ee1538ef6","target":"graph","created_at":"2026-06-26T01:16:18Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.27313/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"A unified representation for text and vision is a natural pursuit, as it enables simpler multimodal modeling and more efficient training. However, representing images as discrete signals in the same way as text inevitably introduces severe information loss. Existing work struggles to balance low-level details and high-level semantics in discrete representations: reconstruction-oriented representations often lack semantic information, whereas semantically stronger features typically suffer from severe loss of detail. We present ViQ, a Visual Quantized Representations framework, which is designe","authors_text":"Han Hu, Jiwen Lu, Shengsheng Qian, Xumin Yu, Yongming Rao, Yuhao Dong, Zhenyu Yang, Zuyan Liu","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-25T17:29:27Z","title":"ViQ: Text-Aligned Visual Quantized Representations at Any Resolution"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.27313","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a59a5597f6ecedbf1038c28a9e65b8f05f42da94eb4359a46d87662dac43aa63","target":"record","created_at":"2026-06-26T01:16:18Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e6ad607eb650bba1e649d017513e2633b4ace74720f048589fed7187ac35c024","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-25T17:29:27Z","title_canon_sha256":"ad85854e54d2aebbdb00288996714be6be89e9626c559af97addb0617b3c49a3"},"schema_version":"1.0","source":{"id":"2606.27313","kind":"arxiv","version":1}},"canonical_sha256":"ec40e07e1047190a625615193e423fd8729e5358fd7f5ef177b28b1644831229","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"ec40e07e1047190a625615193e423fd8729e5358fd7f5ef177b28b1644831229","first_computed_at":"2026-06-26T01:16:18.433570Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-26T01:16:18.433570Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"rOYPxkO38oN0L8Dw87HqPKirE13RCrjk5dxt/bL88G4NQwiQfLVmrI2hutMAnGsaLTsgspyauGb8KSw0EGf8CA==","signature_status":"signed_v1","signed_at":"2026-06-26T01:16:18.433968Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.27313","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a59a5597f6ecedbf1038c28a9e65b8f05f42da94eb4359a46d87662dac43aa63","sha256:02a5b659f85af05bca3bc5b72de98c3428989881b18a35ead738571ee1538ef6"],"state_sha256":"e54511f4e4720463ee70cfc5bf6077df13db9a8ebba466770edbab050f5bdd4d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"InAubTOHEaLxKJHsMWXlkGr7env+OKTAiswl/72UzWQuIMUCBFaN3tGvqtKNjXeswK0ssD2aUbuyxY15slEtBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-01T16:42:25.389799Z","bundle_sha256":"36ddd5c2580c4397e6e6453c347bf73703134965c02e6d2de194ce446e532122"}}