{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:4KGQ6XSWDCTQWUFQ7ZRS6XEGGI","short_pith_number":"pith:4KGQ6XSW","schema_version":"1.0","canonical_sha256":"e28d0f5e5618a70b50b0fe632f5c8632332e0db0f55892020bdc3fe39de865d4","source":{"kind":"arxiv","id":"2606.27715","version":1},"attestation_state":"computed","paper":{"title":"Aurora: A Leverage-Aware Spectral Optimizer","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Alec Dewulf, Ashley Zhang, Ben Keigwin, Dhruv Pai, Li Yang","submitted_at":"2026-06-26T04:47:37Z","abstract_excerpt":"We show that for tall matrix parameters, like projection matrices in the MLP layers, the Muon update can have row norms that are arbitrarily non-uniform. This can lead to a self-reinforcing feedback loop whereby neurons receive persistently small updates and eventually do not contribute meaningfully to network outputs. This problem is effectively mitigated by an additional row normalization step, but current methods do this in a way that moves the Muon update geometry away from the polar factor of the momentum matrix, which we find is undesirable. We propose Aurora, an optimizer that enforces "},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2606.27715","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-26T04:47:37Z","cross_cats_sorted":[],"title_canon_sha256":"778a6021b2ed9d1ee2d1da57209f16a7b62184d489b6891792424e44d99422f0","abstract_canon_sha256":"d4a0a2e11a1c6f95ae0fa7d524abf9870199021544e416a0a5ef5820933bd790"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-29T01:14:46.239735Z","signature_b64":"hZ/KUzYC2fcy1cHpEIBJl6DUVBYlIjRhVn/9dcBBzM8IBYChVsBxPjlkbsj9RnmxithDxtgz7d6l8U/w2FxbBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e28d0f5e5618a70b50b0fe632f5c8632332e0db0f55892020bdc3fe39de865d4","last_reissued_at":"2026-06-29T01:14:46.239347Z","signature_status":"signed_v1","first_computed_at":"2026-06-29T01:14:46.239347Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Aurora: A Leverage-Aware Spectral Optimizer","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Alec Dewulf, Ashley Zhang, Ben Keigwin, Dhruv Pai, Li Yang","submitted_at":"2026-06-26T04:47:37Z","abstract_excerpt":"We show that for tall matrix parameters, like projection matrices in the MLP layers, the Muon update can have row norms that are arbitrarily non-uniform. This can lead to a self-reinforcing feedback loop whereby neurons receive persistently small updates and eventually do not contribute meaningfully to network outputs. This problem is effectively mitigated by an additional row normalization step, but current methods do this in a way that moves the Muon update geometry away from the polar factor of the momentum matrix, which we find is undesirable. We propose Aurora, an optimizer that enforces "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.27715","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.27715/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2606.27715","created_at":"2026-06-29T01:14:46.239400+00:00"},{"alias_kind":"arxiv_version","alias_value":"2606.27715v1","created_at":"2026-06-29T01:14:46.239400+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.27715","created_at":"2026-06-29T01:14:46.239400+00:00"},{"alias_kind":"pith_short_12","alias_value":"4KGQ6XSWDCTQ","created_at":"2026-06-29T01:14:46.239400+00:00"},{"alias_kind":"pith_short_16","alias_value":"4KGQ6XSWDCTQWUFQ","created_at":"2026-06-29T01:14:46.239400+00:00"},{"alias_kind":"pith_short_8","alias_value":"4KGQ6XSW","created_at":"2026-06-29T01:14:46.239400+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI","json":"https://pith.science/pith/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI.json","graph_json":"https://pith.science/api/pith-number/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI/graph.json","events_json":"https://pith.science/api/pith-number/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI/events.json","paper":"https://pith.science/paper/4KGQ6XSW"},"agent_actions":{"view_html":"https://pith.science/pith/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI","download_json":"https://pith.science/pith/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI.json","view_paper":"https://pith.science/paper/4KGQ6XSW","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2606.27715&json=true","fetch_graph":"https://pith.science/api/pith-number/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI/graph.json","fetch_events":"https://pith.science/api/pith-number/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI/action/timestamp_anchor","attest_storage":"https://pith.science/pith/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI/action/storage_attestation","attest_author":"https://pith.science/pith/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI/action/author_attestation","sign_citation":"https://pith.science/pith/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI/action/citation_signature","submit_replication":"https://pith.science/pith/4KGQ6XSWDCTQWUFQ7ZRS6XEGGI/action/replication_record"}},"created_at":"2026-06-29T01:14:46.239400+00:00","updated_at":"2026-06-29T01:14:46.239400+00:00"}