{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:NYLWGCIX6KUDIAKDBRMBW5CXYA","short_pith_number":"pith:NYLWGCIX","canonical_record":{"source":{"id":"2605.28388","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-27T12:25:57Z","cross_cats_sorted":[],"title_canon_sha256":"a171ea4e8538f4e0c39ebfb85e107b69668b0719a288b8365497839de571b993","abstract_canon_sha256":"034a83825d0962298fb22be8375c79501a808ddc0cd29f602d637d7a534aa26b"},"schema_version":"1.0"},"canonical_sha256":"6e17630917f2a83401430c581b7457c004c7ae8447f0590e270eb8e55584553d","source":{"kind":"arxiv","id":"2605.28388","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.28388","created_at":"2026-05-28T01:05:16Z"},{"alias_kind":"arxiv_version","alias_value":"2605.28388v1","created_at":"2026-05-28T01:05:16Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.28388","created_at":"2026-05-28T01:05:16Z"},{"alias_kind":"pith_short_12","alias_value":"NYLWGCIX6KUD","created_at":"2026-05-28T01:05:16Z"},{"alias_kind":"pith_short_16","alias_value":"NYLWGCIX6KUDIAKD","created_at":"2026-05-28T01:05:16Z"},{"alias_kind":"pith_short_8","alias_value":"NYLWGCIX","created_at":"2026-05-28T01:05:16Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:NYLWGCIX6KUDIAKDBRMBW5CXYA","target":"record","payload":{"canonical_record":{"source":{"id":"2605.28388","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-27T12:25:57Z","cross_cats_sorted":[],"title_canon_sha256":"a171ea4e8538f4e0c39ebfb85e107b69668b0719a288b8365497839de571b993","abstract_canon_sha256":"034a83825d0962298fb22be8375c79501a808ddc0cd29f602d637d7a534aa26b"},"schema_version":"1.0"},"canonical_sha256":"6e17630917f2a83401430c581b7457c004c7ae8447f0590e270eb8e55584553d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-28T01:05:16.806932Z","signature_b64":"vjsW+EQ7D10624BxZZwYSFhlGerbEmphYO7FBqN+ULu01PDUnDBVyrHcmiC6zyvjn5BnTJ/pXGTPXHZFcXTFAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6e17630917f2a83401430c581b7457c004c7ae8447f0590e270eb8e55584553d","last_reissued_at":"2026-05-28T01:05:16.806529Z","signature_status":"signed_v1","first_computed_at":"2026-05-28T01:05:16.806529Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.28388","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-28T01:05:16Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"A8/2BzpUGfB4KWncXyeGUvlKNK8lUhZdeZUYtApWPNS809l9mkv7fRF9+Jws/cJ/cJzyJfYK5bjBD09AhjetBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T23:37:20.224063Z"},"content_sha256":"963aa421f8c44282da6d77f7d5a4ac084eb300a909884357ffc1a2998bf57c17","schema_version":"1.0","event_id":"sha256:963aa421f8c44282da6d77f7d5a4ac084eb300a909884357ffc1a2998bf57c17"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:NYLWGCIX6KUDIAKDBRMBW5CXYA","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Mechanistically Interpreting the Role of Sample Difficulty in RLVR for LLMs","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Jiajun Zhang, Weiwei Xing, Xiaohui Gao, Yue Cheng, Zhanxing Zhu, Zheng Wang","submitted_at":"2026-05-27T12:25:57Z","abstract_excerpt":"Reinforcement Learning with Verifiable Reward (RLVR) is empirically shown to notably enhance the reasoning performance of large language models (LLMs), particularly in mathematics and programming. However, the mechanistic role of Sample Difficulty in RLVR remains poorly understood. In this paper, we investigate RLVR through the lens of difficulty-wise and one-sample analysis. We find that sample difficulty has a non-monotonic effect on RLVR: easy and medium-difficulty problems yield the strongest and most stable reasoning improvements, whereas overly hard problems often provide weak learning s"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.28388","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.28388/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-28T01:05:16Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"A6kCW61gqQM5jQRJ2bdLTB04uftgtWGnhBUgVam0B0JUPvAecz6QqqZ/7RFlrjlHGQDTqVhDVE2q2D87TeBmDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T23:37:20.224445Z"},"content_sha256":"87af40c77f93652bfa59ebef54d12971e9e7a48fe4d2d4299ef6fbc25c0f9ab8","schema_version":"1.0","event_id":"sha256:87af40c77f93652bfa59ebef54d12971e9e7a48fe4d2d4299ef6fbc25c0f9ab8"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/NYLWGCIX6KUDIAKDBRMBW5CXYA/bundle.json","state_url":"https://pith.science/pith/NYLWGCIX6KUDIAKDBRMBW5CXYA/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/NYLWGCIX6KUDIAKDBRMBW5CXYA/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T23:37:20Z","links":{"resolver":"https://pith.science/pith/NYLWGCIX6KUDIAKDBRMBW5CXYA","bundle":"https://pith.science/pith/NYLWGCIX6KUDIAKDBRMBW5CXYA/bundle.json","state":"https://pith.science/pith/NYLWGCIX6KUDIAKDBRMBW5CXYA/state.json","well_known_bundle":"https://pith.science/.well-known/pith/NYLWGCIX6KUDIAKDBRMBW5CXYA/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:NYLWGCIX6KUDIAKDBRMBW5CXYA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"034a83825d0962298fb22be8375c79501a808ddc0cd29f602d637d7a534aa26b","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-27T12:25:57Z","title_canon_sha256":"a171ea4e8538f4e0c39ebfb85e107b69668b0719a288b8365497839de571b993"},"schema_version":"1.0","source":{"id":"2605.28388","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.28388","created_at":"2026-05-28T01:05:16Z"},{"alias_kind":"arxiv_version","alias_value":"2605.28388v1","created_at":"2026-05-28T01:05:16Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.28388","created_at":"2026-05-28T01:05:16Z"},{"alias_kind":"pith_short_12","alias_value":"NYLWGCIX6KUD","created_at":"2026-05-28T01:05:16Z"},{"alias_kind":"pith_short_16","alias_value":"NYLWGCIX6KUDIAKD","created_at":"2026-05-28T01:05:16Z"},{"alias_kind":"pith_short_8","alias_value":"NYLWGCIX","created_at":"2026-05-28T01:05:16Z"}],"graph_snapshots":[{"event_id":"sha256:87af40c77f93652bfa59ebef54d12971e9e7a48fe4d2d4299ef6fbc25c0f9ab8","target":"graph","created_at":"2026-05-28T01:05:16Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.28388/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Reinforcement Learning with Verifiable Reward (RLVR) is empirically shown to notably enhance the reasoning performance of large language models (LLMs), particularly in mathematics and programming. However, the mechanistic role of Sample Difficulty in RLVR remains poorly understood. In this paper, we investigate RLVR through the lens of difficulty-wise and one-sample analysis. We find that sample difficulty has a non-monotonic effect on RLVR: easy and medium-difficulty problems yield the strongest and most stable reasoning improvements, whereas overly hard problems often provide weak learning s","authors_text":"Jiajun Zhang, Weiwei Xing, Xiaohui Gao, Yue Cheng, Zhanxing Zhu, Zheng Wang","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-27T12:25:57Z","title":"Mechanistically Interpreting the Role of Sample Difficulty in RLVR for LLMs"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.28388","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:963aa421f8c44282da6d77f7d5a4ac084eb300a909884357ffc1a2998bf57c17","target":"record","created_at":"2026-05-28T01:05:16Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"034a83825d0962298fb22be8375c79501a808ddc0cd29f602d637d7a534aa26b","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-27T12:25:57Z","title_canon_sha256":"a171ea4e8538f4e0c39ebfb85e107b69668b0719a288b8365497839de571b993"},"schema_version":"1.0","source":{"id":"2605.28388","kind":"arxiv","version":1}},"canonical_sha256":"6e17630917f2a83401430c581b7457c004c7ae8447f0590e270eb8e55584553d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"6e17630917f2a83401430c581b7457c004c7ae8447f0590e270eb8e55584553d","first_computed_at":"2026-05-28T01:05:16.806529Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-28T01:05:16.806529Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"vjsW+EQ7D10624BxZZwYSFhlGerbEmphYO7FBqN+ULu01PDUnDBVyrHcmiC6zyvjn5BnTJ/pXGTPXHZFcXTFAA==","signature_status":"signed_v1","signed_at":"2026-05-28T01:05:16.806932Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.28388","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:963aa421f8c44282da6d77f7d5a4ac084eb300a909884357ffc1a2998bf57c17","sha256:87af40c77f93652bfa59ebef54d12971e9e7a48fe4d2d4299ef6fbc25c0f9ab8"],"state_sha256":"84f36dc182580a6c6b4534996107b42d68ee9ea14959b381dcee8556dd99cea9"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"LKtsMKh+7XP5dtpzawV3MmQ8PfpjlgJxuiXkwt8m+EApHhsog3b0/p33kOjgwMQa5bKC7eQxCSDn19jAbQ9OBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T23:37:20.226586Z","bundle_sha256":"60dbeb1aa88469bdbe85fe416c8c397a2d521b7c4bbe64053b1f64ddc70ca1d8"}}