{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:5CN7UH6RWEFHR4JG2KGUCC33S6","short_pith_number":"pith:5CN7UH6R","schema_version":"1.0","canonical_sha256":"e89bfa1fd1b10a78f126d28d410b7b97984ea2315faea1a73f4afb3cfbe4ac0b","source":{"kind":"arxiv","id":"2605.28585","version":1},"attestation_state":"computed","paper":{"title":"Outer-Momentum Restarting in High-Dimensional Two-Phase Optimization","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Allan Ma, Anna Choromanska, Kristi Topollai, Sui Jiet Tay, Tolga Dimlioglu","submitted_at":"2026-05-27T15:09:02Z","abstract_excerpt":"Communication-efficient distributed optimizers such as DiLoCo reduce synchronization costs by letting workers perform many local updates before aggregating their progress with an outer momentum optimizer. Recent theory suggests that the outer optimizer acts on an effective spectrum induced by the inner optimization loop, and that the choice of outer momentum controls how progress from local updates is accumulated across communication rounds. We study periodic restarting of the outer momentum as a simple complementary mechanism for controlling this outer memory. In a linearized squared-loss mod"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.28585","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-27T15:09:02Z","cross_cats_sorted":[],"title_canon_sha256":"6ee3bede62074e9ea86eaf995b98f920c176698eb3cf7c3f664ec284c29b66f6","abstract_canon_sha256":"1aaad03fe882a0e4772cc72bd30c167d939c4d83b7ec2d8d7bbe448d0e4ca2dc"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-28T02:04:57.108686Z","signature_b64":"cpVRTc6tJtPQnyxJIyhVVd2csxxq6N9Ec0+IXzN9UX9abhPehYpbinRR5p4sU8poenPUcp4cHL/EJdP0TTbGCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e89bfa1fd1b10a78f126d28d410b7b97984ea2315faea1a73f4afb3cfbe4ac0b","last_reissued_at":"2026-05-28T02:04:57.108272Z","signature_status":"signed_v1","first_computed_at":"2026-05-28T02:04:57.108272Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Outer-Momentum Restarting in High-Dimensional Two-Phase Optimization","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Allan Ma, Anna Choromanska, Kristi Topollai, Sui Jiet Tay, Tolga Dimlioglu","submitted_at":"2026-05-27T15:09:02Z","abstract_excerpt":"Communication-efficient distributed optimizers such as DiLoCo reduce synchronization costs by letting workers perform many local updates before aggregating their progress with an outer momentum optimizer. Recent theory suggests that the outer optimizer acts on an effective spectrum induced by the inner optimization loop, and that the choice of outer momentum controls how progress from local updates is accumulated across communication rounds. We study periodic restarting of the outer momentum as a simple complementary mechanism for controlling this outer memory. In a linearized squared-loss mod"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.28585","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.28585/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.28585","created_at":"2026-05-28T02:04:57.108334+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.28585v1","created_at":"2026-05-28T02:04:57.108334+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.28585","created_at":"2026-05-28T02:04:57.108334+00:00"},{"alias_kind":"pith_short_12","alias_value":"5CN7UH6RWEFH","created_at":"2026-05-28T02:04:57.108334+00:00"},{"alias_kind":"pith_short_16","alias_value":"5CN7UH6RWEFHR4JG","created_at":"2026-05-28T02:04:57.108334+00:00"},{"alias_kind":"pith_short_8","alias_value":"5CN7UH6R","created_at":"2026-05-28T02:04:57.108334+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/5CN7UH6RWEFHR4JG2KGUCC33S6","json":"https://pith.science/pith/5CN7UH6RWEFHR4JG2KGUCC33S6.json","graph_json":"https://pith.science/api/pith-number/5CN7UH6RWEFHR4JG2KGUCC33S6/graph.json","events_json":"https://pith.science/api/pith-number/5CN7UH6RWEFHR4JG2KGUCC33S6/events.json","paper":"https://pith.science/paper/5CN7UH6R"},"agent_actions":{"view_html":"https://pith.science/pith/5CN7UH6RWEFHR4JG2KGUCC33S6","download_json":"https://pith.science/pith/5CN7UH6RWEFHR4JG2KGUCC33S6.json","view_paper":"https://pith.science/paper/5CN7UH6R","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.28585&json=true","fetch_graph":"https://pith.science/api/pith-number/5CN7UH6RWEFHR4JG2KGUCC33S6/graph.json","fetch_events":"https://pith.science/api/pith-number/5CN7UH6RWEFHR4JG2KGUCC33S6/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/5CN7UH6RWEFHR4JG2KGUCC33S6/action/timestamp_anchor","attest_storage":"https://pith.science/pith/5CN7UH6RWEFHR4JG2KGUCC33S6/action/storage_attestation","attest_author":"https://pith.science/pith/5CN7UH6RWEFHR4JG2KGUCC33S6/action/author_attestation","sign_citation":"https://pith.science/pith/5CN7UH6RWEFHR4JG2KGUCC33S6/action/citation_signature","submit_replication":"https://pith.science/pith/5CN7UH6RWEFHR4JG2KGUCC33S6/action/replication_record"}},"created_at":"2026-05-28T02:04:57.108334+00:00","updated_at":"2026-05-28T02:04:57.108334+00:00"}