{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:FAY3G6UTDEDBNILEBQ4YQRD363","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"12a00b40ea8be230edc1dfe81a5ac5d50893374471543873b16d2fbd40954d0a","cross_cats_sorted":["cs.CV"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-06-16T07:04:13Z","title_canon_sha256":"af79d1f7760c78c95a8149f451f63368c80e09f2306dfca52bbb601a7160abdd"},"schema_version":"1.0","source":{"id":"2606.17598","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.17598","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"arxiv_version","alias_value":"2606.17598v1","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.17598","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"pith_short_12","alias_value":"FAY3G6UTDEDB","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"pith_short_16","alias_value":"FAY3G6UTDEDBNILE","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"pith_short_8","alias_value":"FAY3G6UT","created_at":"2026-06-19T16:10:16Z"}],"graph_snapshots":[{"event_id":"sha256:0cdd22c42842481c86b5191f440bdd28704d97ed73e633692f2840b896543e3d","target":"graph","created_at":"2026-06-19T16:10:16Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.17598/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Humans naturally leverage diverse sensing modalities to interact with the physical world, while most Vision-Language-Action (VLA) models for robotics rely solely on RGB observations. This limits their ability to perceive physical properties that are difficult or impossible to infer from RGB cameras, such as temperature, sound, or radar response. We present MuseVLA, an adaptive multimodal sensing VLA model that integrates novel sensors as on-demand tools for robotic manipulation. Given a task instruction and visual context, MuseVLA first generates a sensor token and target description that sele","authors_text":"Baining Guo, Chenren Xu, Heyu Guo, Jiaolong Yang, Lin Luo, Qingwen Yang, Qixiu Li, Ruichun Ma, Shiqi Jiang, Xingyuming Liu","cross_cats":["cs.CV"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-06-16T07:04:13Z","title":"MuseVLA: An Adaptive Multimodal Sensing Vision-Language-Action Model for Robotic Manipulation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.17598","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:cf52df7fc4936636b38f14e84a28039ad3cabb565ec501a1582ce9d41a1cd509","target":"record","created_at":"2026-06-19T16:10:16Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"12a00b40ea8be230edc1dfe81a5ac5d50893374471543873b16d2fbd40954d0a","cross_cats_sorted":["cs.CV"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-06-16T07:04:13Z","title_canon_sha256":"af79d1f7760c78c95a8149f451f63368c80e09f2306dfca52bbb601a7160abdd"},"schema_version":"1.0","source":{"id":"2606.17598","kind":"arxiv","version":1}},"canonical_sha256":"2831b37a93190616a1640c3988447bf6d278cc8c0e359ddf562b332ef6419d26","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"2831b37a93190616a1640c3988447bf6d278cc8c0e359ddf562b332ef6419d26","first_computed_at":"2026-06-19T16:10:16.954715Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-19T16:10:16.954715Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"9w6zsu4js9Ny/1S/PQEo76JJcVqXOtxJuV8BWuk7sd3ENAOs6jc1lcl08wL9XTfU0CwaxmeASrzc25kkywyuAg==","signature_status":"signed_v1","signed_at":"2026-06-19T16:10:16.955064Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.17598","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:cf52df7fc4936636b38f14e84a28039ad3cabb565ec501a1582ce9d41a1cd509","sha256:0cdd22c42842481c86b5191f440bdd28704d97ed73e633692f2840b896543e3d"],"state_sha256":"9fbf4f0472e65acc265d4fe99c649d21ff72bf157c2a7b960890bdc1c71e7f5c"}