{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:5GF5WM52GUCYYH4Y437L4TNHRV","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e4fdcced690859587ba3c4125bcd67a36686c87a6013a69926de301d2344e059","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-07-01T16:12:24Z","title_canon_sha256":"c8078414903afdf6e0287bbfa408e620f59f81e1674af8ecb54e68a1cd06057b"},"schema_version":"1.0","source":{"id":"2607.01124","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2607.01124","created_at":"2026-07-02T01:18:29Z"},{"alias_kind":"arxiv_version","alias_value":"2607.01124v1","created_at":"2026-07-02T01:18:29Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2607.01124","created_at":"2026-07-02T01:18:29Z"},{"alias_kind":"pith_short_12","alias_value":"5GF5WM52GUCY","created_at":"2026-07-02T01:18:29Z"},{"alias_kind":"pith_short_16","alias_value":"5GF5WM52GUCYYH4Y","created_at":"2026-07-02T01:18:29Z"},{"alias_kind":"pith_short_8","alias_value":"5GF5WM52","created_at":"2026-07-02T01:18:29Z"}],"graph_snapshots":[{"event_id":"sha256:d45a1f4c126b6e2b440e6688d8d5b757904a48c749886a1cd2f20cfceb2524b6","target":"graph","created_at":"2026-07-02T01:18:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2607.01124/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Muon has recently emerged as one of the most effective optimizers for training large neural networks, yet its empirical success has been explained from several different perspectives. In this paper, we propose a simple mechanistic interpretation: Muon can be understood as an implicit residual connection during training. Specifically, orthogonalizing the update can sacrifice some immediate gradient fidelity while improving representation preservation for downstream layers. We study this trade-off in controlled linear optimization settings, where Muon can learn representations that are slower to","authors_text":"Hao Huang","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-07-01T16:12:24Z","title":"Muon as a Residual Connection"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2607.01124","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ec7d7d8e5125b364cbd68838b1b91e00e97deebb1e8c90e916f430f4591de02a","target":"record","created_at":"2026-07-02T01:18:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e4fdcced690859587ba3c4125bcd67a36686c87a6013a69926de301d2344e059","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-07-01T16:12:24Z","title_canon_sha256":"c8078414903afdf6e0287bbfa408e620f59f81e1674af8ecb54e68a1cd06057b"},"schema_version":"1.0","source":{"id":"2607.01124","kind":"arxiv","version":1}},"canonical_sha256":"e98bdb33ba35058c1f98e6febe4da78d5c8fc151969e7aea3d1d79ef07b7cbed","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e98bdb33ba35058c1f98e6febe4da78d5c8fc151969e7aea3d1d79ef07b7cbed","first_computed_at":"2026-07-02T01:18:29.774839Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-02T01:18:29.774839Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"MghYnt96LjQr1Eg3Hykob2SIwxtmXNMHt9XYSwLbP4pezcTk9CT/vJRqz1286Z7M6CDqvSKK9qO30AxgblZ6Aw==","signature_status":"signed_v1","signed_at":"2026-07-02T01:18:29.775261Z","signed_message":"canonical_sha256_bytes"},"source_id":"2607.01124","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ec7d7d8e5125b364cbd68838b1b91e00e97deebb1e8c90e916f430f4591de02a","sha256:d45a1f4c126b6e2b440e6688d8d5b757904a48c749886a1cd2f20cfceb2524b6"],"state_sha256":"a17d2b5e044d9147439a82180d2ae6e214195242045bc555efb64d612a8d1f55"}