{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:GJEAEQCEE374P3IC4BTDRBSLNK","short_pith_number":"pith:GJEAEQCE","canonical_record":{"source":{"id":"2606.23364","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T14:00:26Z","cross_cats_sorted":["math.DS","math.OC"],"title_canon_sha256":"bac2d811a61234ecca067f04942475edbe2de80da692f92e0d8c8dfd49969c90","abstract_canon_sha256":"0a52e346b029e678cf287c1d7843292de0ff8e3567e12b79991a4e923d82cf1d"},"schema_version":"1.0"},"canonical_sha256":"324802404426ffc7ed02e06638864b6aafe0b312c702b4bc4193f080feee8860","source":{"kind":"arxiv","id":"2606.23364","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.23364","created_at":"2026-06-23T03:14:17Z"},{"alias_kind":"arxiv_version","alias_value":"2606.23364v1","created_at":"2026-06-23T03:14:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.23364","created_at":"2026-06-23T03:14:17Z"},{"alias_kind":"pith_short_12","alias_value":"GJEAEQCEE374","created_at":"2026-06-23T03:14:17Z"},{"alias_kind":"pith_short_16","alias_value":"GJEAEQCEE374P3IC","created_at":"2026-06-23T03:14:17Z"},{"alias_kind":"pith_short_8","alias_value":"GJEAEQCE","created_at":"2026-06-23T03:14:17Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:GJEAEQCEE374P3IC4BTDRBSLNK","target":"record","payload":{"canonical_record":{"source":{"id":"2606.23364","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T14:00:26Z","cross_cats_sorted":["math.DS","math.OC"],"title_canon_sha256":"bac2d811a61234ecca067f04942475edbe2de80da692f92e0d8c8dfd49969c90","abstract_canon_sha256":"0a52e346b029e678cf287c1d7843292de0ff8e3567e12b79991a4e923d82cf1d"},"schema_version":"1.0"},"canonical_sha256":"324802404426ffc7ed02e06638864b6aafe0b312c702b4bc4193f080feee8860","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-23T03:14:17.877168Z","signature_b64":"NY7UtFqaanVSZC9mNJmL1A0hFDAgDrr7fvpYBVO+B6RW2XqX4NfCvVroFB2o05P7aXma/E+UT9clz0IPfhdeDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"324802404426ffc7ed02e06638864b6aafe0b312c702b4bc4193f080feee8860","last_reissued_at":"2026-06-23T03:14:17.876777Z","signature_status":"signed_v1","first_computed_at":"2026-06-23T03:14:17.876777Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.23364","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-23T03:14:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1p2EL90Vc3b4RyU0C0+6Fn4sx3buMWXL6SmQTgeJRpgxNSprvPmmgxDRvXA882vDMB4TAmWCLL/Wpiu4/4lPCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T11:26:24.849500Z"},"content_sha256":"6667e30981a9bca8cd9e1f9c63f4d7c296e76b7c417604ef1d199dc87d6064e5","schema_version":"1.0","event_id":"sha256:6667e30981a9bca8cd9e1f9c63f4d7c296e76b7c417604ef1d199dc87d6064e5"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:GJEAEQCEE374P3IC4BTDRBSLNK","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Convergence of Gradient Descent for General Neural Network Architectures Beyond the NTK Regime","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["math.DS","math.OC"],"primary_cat":"cs.LG","authors_text":"Yuqing Wang","submitted_at":"2026-06-22T14:00:26Z","abstract_excerpt":"Training dynamics is central to understanding neural networks, yet its theoretical analysis remains difficult even for simple architectures and becomes substantially more challenging for general modern architectures. In this paper, we propose a convergence framework for analyzing gradient descent (GD) dynamics under a broad family of neural network architectures and datasets beyond the neural tangent kernel (NTK) regime. The framework is formulated at the level of network blocks and covers architectures including pre-normalized multi-layer transformers. More precisely, under mild assumptions, "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.23364","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.23364/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-23T03:14:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"3RwliUkVpMajnj2KDnCCh5axUxnKlF6mQeys0H40xnUzI0oqCgcudAchcrLut/qJVjHisSmRoR9LH4kA+80PCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T11:26:24.849893Z"},"content_sha256":"14b7feef50455ea6907b8b54aa7861d08f506320784922915324f4d08f1034d2","schema_version":"1.0","event_id":"sha256:14b7feef50455ea6907b8b54aa7861d08f506320784922915324f4d08f1034d2"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/GJEAEQCEE374P3IC4BTDRBSLNK/bundle.json","state_url":"https://pith.science/pith/GJEAEQCEE374P3IC4BTDRBSLNK/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/GJEAEQCEE374P3IC4BTDRBSLNK/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-02T11:26:24Z","links":{"resolver":"https://pith.science/pith/GJEAEQCEE374P3IC4BTDRBSLNK","bundle":"https://pith.science/pith/GJEAEQCEE374P3IC4BTDRBSLNK/bundle.json","state":"https://pith.science/pith/GJEAEQCEE374P3IC4BTDRBSLNK/state.json","well_known_bundle":"https://pith.science/.well-known/pith/GJEAEQCEE374P3IC4BTDRBSLNK/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:GJEAEQCEE374P3IC4BTDRBSLNK","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0a52e346b029e678cf287c1d7843292de0ff8e3567e12b79991a4e923d82cf1d","cross_cats_sorted":["math.DS","math.OC"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T14:00:26Z","title_canon_sha256":"bac2d811a61234ecca067f04942475edbe2de80da692f92e0d8c8dfd49969c90"},"schema_version":"1.0","source":{"id":"2606.23364","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.23364","created_at":"2026-06-23T03:14:17Z"},{"alias_kind":"arxiv_version","alias_value":"2606.23364v1","created_at":"2026-06-23T03:14:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.23364","created_at":"2026-06-23T03:14:17Z"},{"alias_kind":"pith_short_12","alias_value":"GJEAEQCEE374","created_at":"2026-06-23T03:14:17Z"},{"alias_kind":"pith_short_16","alias_value":"GJEAEQCEE374P3IC","created_at":"2026-06-23T03:14:17Z"},{"alias_kind":"pith_short_8","alias_value":"GJEAEQCE","created_at":"2026-06-23T03:14:17Z"}],"graph_snapshots":[{"event_id":"sha256:14b7feef50455ea6907b8b54aa7861d08f506320784922915324f4d08f1034d2","target":"graph","created_at":"2026-06-23T03:14:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.23364/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Training dynamics is central to understanding neural networks, yet its theoretical analysis remains difficult even for simple architectures and becomes substantially more challenging for general modern architectures. In this paper, we propose a convergence framework for analyzing gradient descent (GD) dynamics under a broad family of neural network architectures and datasets beyond the neural tangent kernel (NTK) regime. The framework is formulated at the level of network blocks and covers architectures including pre-normalized multi-layer transformers. More precisely, under mild assumptions, ","authors_text":"Yuqing Wang","cross_cats":["math.DS","math.OC"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T14:00:26Z","title":"Convergence of Gradient Descent for General Neural Network Architectures Beyond the NTK Regime"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.23364","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:6667e30981a9bca8cd9e1f9c63f4d7c296e76b7c417604ef1d199dc87d6064e5","target":"record","created_at":"2026-06-23T03:14:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0a52e346b029e678cf287c1d7843292de0ff8e3567e12b79991a4e923d82cf1d","cross_cats_sorted":["math.DS","math.OC"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T14:00:26Z","title_canon_sha256":"bac2d811a61234ecca067f04942475edbe2de80da692f92e0d8c8dfd49969c90"},"schema_version":"1.0","source":{"id":"2606.23364","kind":"arxiv","version":1}},"canonical_sha256":"324802404426ffc7ed02e06638864b6aafe0b312c702b4bc4193f080feee8860","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"324802404426ffc7ed02e06638864b6aafe0b312c702b4bc4193f080feee8860","first_computed_at":"2026-06-23T03:14:17.876777Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-23T03:14:17.876777Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"NY7UtFqaanVSZC9mNJmL1A0hFDAgDrr7fvpYBVO+B6RW2XqX4NfCvVroFB2o05P7aXma/E+UT9clz0IPfhdeDw==","signature_status":"signed_v1","signed_at":"2026-06-23T03:14:17.877168Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.23364","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:6667e30981a9bca8cd9e1f9c63f4d7c296e76b7c417604ef1d199dc87d6064e5","sha256:14b7feef50455ea6907b8b54aa7861d08f506320784922915324f4d08f1034d2"],"state_sha256":"3cc2baab4cc9465c1e70b0ba0e6d6abdf3dfd11af221279b81484bdd6974aba3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"vUI2ekWfzHrrtzTQcuNcOR8c7HW6UdbpiGmA/LzJSbzLTkVqfJJAzkn+FyOCEvfy1N4nvsRen3SKg2RLJEnZAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-02T11:26:24.851844Z","bundle_sha256":"e4033b574a3e53396db136ed131f497ba76614b7d55a23fc7d8001fea65a94cc"}}