{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:LAVMIUQXXDOP27ZZVIZYRC2A3Q","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ae075212a32f657773cffa41cf4aed9c16e0ea70ab1038d335169a059bbfd3d9","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-11T12:30:05Z","title_canon_sha256":"6b58b31cb6c61a3e655961f7d7b6d0a074699b03ac08137df1518adcc7395a56"},"schema_version":"1.0","source":{"id":"2606.13276","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.13276","created_at":"2026-06-12T01:09:50Z"},{"alias_kind":"arxiv_version","alias_value":"2606.13276v1","created_at":"2026-06-12T01:09:50Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.13276","created_at":"2026-06-12T01:09:50Z"},{"alias_kind":"pith_short_12","alias_value":"LAVMIUQXXDOP","created_at":"2026-06-12T01:09:50Z"},{"alias_kind":"pith_short_16","alias_value":"LAVMIUQXXDOP27ZZ","created_at":"2026-06-12T01:09:50Z"},{"alias_kind":"pith_short_8","alias_value":"LAVMIUQX","created_at":"2026-06-12T01:09:50Z"}],"graph_snapshots":[{"event_id":"sha256:b8bd847b2ea99d8c4819a62efc9b4d6d70fe4a421d8729155a3de41d39adc7db","target":"graph","created_at":"2026-06-12T01:09:50Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.13276/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Weight-space geometry plays a central role in neural network optimization, yet manifold constraints are often applied uniformly across all weight matrices. In this work, we ask whether different transformer modules prefer different manifold geometries. We study Manifold Muon for GPT-2 pretraining and compare layer-wise assignments of Stiefel and DGram constraints across attention and MLP blocks. Our results show a clear asymmetry: constraining attention layers with Stiefel geometry while assigning DGram geometry to MLP layers gives the best performance among the tested configurations, whereas ","authors_text":"Kirato Yoshihara","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-11T12:30:05Z","title":"Different Layers, Different Manifolds: Module-Wise Weight-Space Geometry in Transformer Optimization"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.13276","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ddfe038f9641f3811430c97f170a1192af91ba988a13c06bca764f4266ab4b57","target":"record","created_at":"2026-06-12T01:09:50Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ae075212a32f657773cffa41cf4aed9c16e0ea70ab1038d335169a059bbfd3d9","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-11T12:30:05Z","title_canon_sha256":"6b58b31cb6c61a3e655961f7d7b6d0a074699b03ac08137df1518adcc7395a56"},"schema_version":"1.0","source":{"id":"2606.13276","kind":"arxiv","version":1}},"canonical_sha256":"582ac45217b8dcfd7f39aa33888b40dc38e7a3a8ef3444d96961918b6df4ec45","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"582ac45217b8dcfd7f39aa33888b40dc38e7a3a8ef3444d96961918b6df4ec45","first_computed_at":"2026-06-12T01:09:50.102479Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-12T01:09:50.102479Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"B62twE6nsRmvVdzyIhKbvU+dL6Sspx4/YRH/l6rylwHunk6L9YO/d+GiSGhUKNJycILHSyPaQAWu2tI43ehRDw==","signature_status":"signed_v1","signed_at":"2026-06-12T01:09:50.103313Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.13276","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ddfe038f9641f3811430c97f170a1192af91ba988a13c06bca764f4266ab4b57","sha256:b8bd847b2ea99d8c4819a62efc9b4d6d70fe4a421d8729155a3de41d39adc7db"],"state_sha256":"a72898abc6d2622bfa2c4ffa3e79c5e7ccc72169e6e4cf1f531e4484695d6892"}