{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:IPUKQ7MFSRG7C7BBSXWVWN6SZL","short_pith_number":"pith:IPUKQ7MF","canonical_record":{"source":{"id":"2605.20756","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-20T05:54:24Z","cross_cats_sorted":["cs.AI","math.OC","stat.ML"],"title_canon_sha256":"250eb6b4c8673dd131d5808b0e4d1d8f8b79b3727a80d295f55ea0c20c44dd57","abstract_canon_sha256":"ccbe21564420360e0a9b798548aa8af4993184b5de5611a3f8b19524ba8d4799"},"schema_version":"1.0"},"canonical_sha256":"43e8a87d85944df17c2195ed5b37d2cad97fb1699dc81de679ade54892a43dce","source":{"kind":"arxiv","id":"2605.20756","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.20756","created_at":"2026-05-21T01:04:52Z"},{"alias_kind":"arxiv_version","alias_value":"2605.20756v1","created_at":"2026-05-21T01:04:52Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.20756","created_at":"2026-05-21T01:04:52Z"},{"alias_kind":"pith_short_12","alias_value":"IPUKQ7MFSRG7","created_at":"2026-05-21T01:04:52Z"},{"alias_kind":"pith_short_16","alias_value":"IPUKQ7MFSRG7C7BB","created_at":"2026-05-21T01:04:52Z"},{"alias_kind":"pith_short_8","alias_value":"IPUKQ7MF","created_at":"2026-05-21T01:04:52Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:IPUKQ7MFSRG7C7BBSXWVWN6SZL","target":"record","payload":{"canonical_record":{"source":{"id":"2605.20756","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-20T05:54:24Z","cross_cats_sorted":["cs.AI","math.OC","stat.ML"],"title_canon_sha256":"250eb6b4c8673dd131d5808b0e4d1d8f8b79b3727a80d295f55ea0c20c44dd57","abstract_canon_sha256":"ccbe21564420360e0a9b798548aa8af4993184b5de5611a3f8b19524ba8d4799"},"schema_version":"1.0"},"canonical_sha256":"43e8a87d85944df17c2195ed5b37d2cad97fb1699dc81de679ade54892a43dce","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-21T01:04:52.691291Z","signature_b64":"VaQSj4wOJIcbOYmXgZCT1HVwEykFldrgN4mobsC2rWe0NexZKvgDmLEaEQfi25vhlbldQf1V5Vvjmt7GLL2aDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"43e8a87d85944df17c2195ed5b37d2cad97fb1699dc81de679ade54892a43dce","last_reissued_at":"2026-05-21T01:04:52.690570Z","signature_status":"signed_v1","first_computed_at":"2026-05-21T01:04:52.690570Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.20756","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T01:04:52Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"AjgQ7kZ0H6w8TU6n+17ZmwV3bndbKjzZgW0qpwKc8FmJ91+ZPj5sAcdyid7n89YRC9URllDkPyY+jj5CleZvCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-24T09:05:34.496234Z"},"content_sha256":"ec4b8f952d5ea82a60f9835647c3d78fdfce9d0a43d6e63c90849a25fb9f7777","schema_version":"1.0","event_id":"sha256:ec4b8f952d5ea82a60f9835647c3d78fdfce9d0a43d6e63c90849a25fb9f7777"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:IPUKQ7MFSRG7C7BBSXWVWN6SZL","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Correcting Stochastic Update Bias in Preconditioned Language Model Optimizers","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","math.OC","stat.ML"],"primary_cat":"cs.LG","authors_text":"Ash Lewis, Dhruv Atreja, George Hurn-Maloney, Henrijs Princis, Henry Fawcett, Julia White, Kelton Zhang, Matthew Thomas, Nikhil Nayak, Urchade Zaratiana","submitted_at":"2026-05-20T05:54:24Z","abstract_excerpt":"Preconditioned optimizers are central to language model training, but their stochastic update rules are usually treated as direct approximations to population preconditioned descent. We show that this view misses two finite-sample biases. First, the gradient and preconditioner are typically estimated from the same minibatch, introducing gradient--preconditioner coupling bias. Second, even when the preconditioner estimate is unbiased, its inverse or inverse-root is generally biased because inversion is nonlinear. We propose a single-batch bias-correction framework that addresses both effects: c"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.20756","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.20756/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-21T01:04:52Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"h0P/mPXsQl9a27vfkitHvo0QRiJ7kAOknev2n5rJSXGDt4s5ozLnUl1S/CRd9QBq1hMWc4OpOT219r0XEvJSCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-24T09:05:34.497041Z"},"content_sha256":"097e5a58f235c0e22da7029cc519a3fd9568fe294ded163c8859650decacb9b0","schema_version":"1.0","event_id":"sha256:097e5a58f235c0e22da7029cc519a3fd9568fe294ded163c8859650decacb9b0"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/IPUKQ7MFSRG7C7BBSXWVWN6SZL/bundle.json","state_url":"https://pith.science/pith/IPUKQ7MFSRG7C7BBSXWVWN6SZL/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/IPUKQ7MFSRG7C7BBSXWVWN6SZL/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-24T09:05:34Z","links":{"resolver":"https://pith.science/pith/IPUKQ7MFSRG7C7BBSXWVWN6SZL","bundle":"https://pith.science/pith/IPUKQ7MFSRG7C7BBSXWVWN6SZL/bundle.json","state":"https://pith.science/pith/IPUKQ7MFSRG7C7BBSXWVWN6SZL/state.json","well_known_bundle":"https://pith.science/.well-known/pith/IPUKQ7MFSRG7C7BBSXWVWN6SZL/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:IPUKQ7MFSRG7C7BBSXWVWN6SZL","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ccbe21564420360e0a9b798548aa8af4993184b5de5611a3f8b19524ba8d4799","cross_cats_sorted":["cs.AI","math.OC","stat.ML"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-20T05:54:24Z","title_canon_sha256":"250eb6b4c8673dd131d5808b0e4d1d8f8b79b3727a80d295f55ea0c20c44dd57"},"schema_version":"1.0","source":{"id":"2605.20756","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.20756","created_at":"2026-05-21T01:04:52Z"},{"alias_kind":"arxiv_version","alias_value":"2605.20756v1","created_at":"2026-05-21T01:04:52Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.20756","created_at":"2026-05-21T01:04:52Z"},{"alias_kind":"pith_short_12","alias_value":"IPUKQ7MFSRG7","created_at":"2026-05-21T01:04:52Z"},{"alias_kind":"pith_short_16","alias_value":"IPUKQ7MFSRG7C7BB","created_at":"2026-05-21T01:04:52Z"},{"alias_kind":"pith_short_8","alias_value":"IPUKQ7MF","created_at":"2026-05-21T01:04:52Z"}],"graph_snapshots":[{"event_id":"sha256:097e5a58f235c0e22da7029cc519a3fd9568fe294ded163c8859650decacb9b0","target":"graph","created_at":"2026-05-21T01:04:52Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.20756/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Preconditioned optimizers are central to language model training, but their stochastic update rules are usually treated as direct approximations to population preconditioned descent. We show that this view misses two finite-sample biases. First, the gradient and preconditioner are typically estimated from the same minibatch, introducing gradient--preconditioner coupling bias. Second, even when the preconditioner estimate is unbiased, its inverse or inverse-root is generally biased because inversion is nonlinear. We propose a single-batch bias-correction framework that addresses both effects: c","authors_text":"Ash Lewis, Dhruv Atreja, George Hurn-Maloney, Henrijs Princis, Henry Fawcett, Julia White, Kelton Zhang, Matthew Thomas, Nikhil Nayak, Urchade Zaratiana","cross_cats":["cs.AI","math.OC","stat.ML"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-20T05:54:24Z","title":"Correcting Stochastic Update Bias in Preconditioned Language Model Optimizers"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.20756","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ec4b8f952d5ea82a60f9835647c3d78fdfce9d0a43d6e63c90849a25fb9f7777","target":"record","created_at":"2026-05-21T01:04:52Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ccbe21564420360e0a9b798548aa8af4993184b5de5611a3f8b19524ba8d4799","cross_cats_sorted":["cs.AI","math.OC","stat.ML"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-20T05:54:24Z","title_canon_sha256":"250eb6b4c8673dd131d5808b0e4d1d8f8b79b3727a80d295f55ea0c20c44dd57"},"schema_version":"1.0","source":{"id":"2605.20756","kind":"arxiv","version":1}},"canonical_sha256":"43e8a87d85944df17c2195ed5b37d2cad97fb1699dc81de679ade54892a43dce","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"43e8a87d85944df17c2195ed5b37d2cad97fb1699dc81de679ade54892a43dce","first_computed_at":"2026-05-21T01:04:52.690570Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-21T01:04:52.690570Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"VaQSj4wOJIcbOYmXgZCT1HVwEykFldrgN4mobsC2rWe0NexZKvgDmLEaEQfi25vhlbldQf1V5Vvjmt7GLL2aDw==","signature_status":"signed_v1","signed_at":"2026-05-21T01:04:52.691291Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.20756","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ec4b8f952d5ea82a60f9835647c3d78fdfce9d0a43d6e63c90849a25fb9f7777","sha256:097e5a58f235c0e22da7029cc519a3fd9568fe294ded163c8859650decacb9b0"],"state_sha256":"e3eff90eb61342980771e11b1e4f77e6db86216e515967f29465af3368b93434"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"OTLYjPpLTwqo7+GdhG/ugoeDRfQn90C5JuUyPlsWgT4rQX3qhvfPojHVvrj/yyxOr6Bf3jhTUcW97wJJKqLbBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-24T09:05:34.501177Z","bundle_sha256":"63b5790a5785dc8126e8f13f978fa58b19781f2f04ed1ab4e0b9b5df7080f074"}}