{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:JF3WIZMKMFXYIL5AXZ6S6V3JCV","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5d4e93d302d9f51ed3ae9a824f61a01d7a6b6335eea2c205f085fcda5bcb6bdf","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-18T10:40:55Z","title_canon_sha256":"82f675be3dd2bfc43c65789d5829a4f636972bb2231be9d586f85642fbbc23fb"},"schema_version":"1.0","source":{"id":"2606.20068","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.20068","created_at":"2026-06-19T16:13:02Z"},{"alias_kind":"arxiv_version","alias_value":"2606.20068v1","created_at":"2026-06-19T16:13:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.20068","created_at":"2026-06-19T16:13:02Z"},{"alias_kind":"pith_short_12","alias_value":"JF3WIZMKMFXY","created_at":"2026-06-19T16:13:02Z"},{"alias_kind":"pith_short_16","alias_value":"JF3WIZMKMFXYIL5A","created_at":"2026-06-19T16:13:02Z"},{"alias_kind":"pith_short_8","alias_value":"JF3WIZMK","created_at":"2026-06-19T16:13:02Z"}],"graph_snapshots":[{"event_id":"sha256:0639289e7c55c17cf32e90ba59f2861361b3f3ae3f7517e3fc969b4f1e535dfc","target":"graph","created_at":"2026-06-19T16:13:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.20068/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"While reinforcement learning from verifiable rewards (RLVR) typically has relied on a single binary verification signal, symbolic proof assistants in formal reasoning offer rich, fine-grained structured feedback. This gap between structured processes and unstructured rewards highlights the importance of feedback that is both dense and sound. In this work, we demonstrate that the Lean proof assistant itself can serve as a symbolic process oracle, supplying both outcome-level and fine-grained tactic-level verified feedback during training. Proof attempts are parsed into tactic sequences, and Lea","authors_text":"Minsu Kim, Se-Young Yun","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-18T10:40:55Z","title":"Process-Verified Reinforcement Learning for Theorem Proving via Lean"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.20068","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:709f823422b1e89c106708d55d3ecf7f78d9b70fdb24ae088bd73b199763f8c3","target":"record","created_at":"2026-06-19T16:13:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5d4e93d302d9f51ed3ae9a824f61a01d7a6b6335eea2c205f085fcda5bcb6bdf","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-18T10:40:55Z","title_canon_sha256":"82f675be3dd2bfc43c65789d5829a4f636972bb2231be9d586f85642fbbc23fb"},"schema_version":"1.0","source":{"id":"2606.20068","kind":"arxiv","version":1}},"canonical_sha256":"497764658a616f842fa0be7d2f576915668c30dc7d5836d3aacdedf31aae9a3f","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"497764658a616f842fa0be7d2f576915668c30dc7d5836d3aacdedf31aae9a3f","first_computed_at":"2026-06-19T16:13:02.026918Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-19T16:13:02.026918Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"hT5tkZC8U3yfL1n3kzorcPRMPmpc8XHoTXdQPoEHdyT9vZ+a6Fpw8LKqWUB+kD7EKxQMruRrE+7xY+NvRj60CQ==","signature_status":"signed_v1","signed_at":"2026-06-19T16:13:02.027287Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.20068","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:709f823422b1e89c106708d55d3ecf7f78d9b70fdb24ae088bd73b199763f8c3","sha256:0639289e7c55c17cf32e90ba59f2861361b3f3ae3f7517e3fc969b4f1e535dfc"],"state_sha256":"be4b1f768fcdbd3a4804e61ec17e08ba1faf72a32cf86a2814b3db434b06c29a"}