{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:NIAGMWQYSJDPWAI6JEYSJJCF64","short_pith_number":"pith:NIAGMWQY","canonical_record":{"source":{"id":"2605.18185","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.MA","submitted_at":"2026-05-18T10:26:50Z","cross_cats_sorted":[],"title_canon_sha256":"ddde89a0bf3f87a749edc800cb6aef0f0d47a7724ad7cb4d2a2d33e095d862f1","abstract_canon_sha256":"64d8dd4256561d73340d01650c7e50bea2d3d16a92a558c245426d38f858fc5a"},"schema_version":"1.0"},"canonical_sha256":"6a00665a189246fb011e493124a445f7288ce42dcccc4a1ec0bef51b5da41ee2","source":{"kind":"arxiv","id":"2605.18185","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.18185","created_at":"2026-05-20T00:05:49Z"},{"alias_kind":"arxiv_version","alias_value":"2605.18185v1","created_at":"2026-05-20T00:05:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18185","created_at":"2026-05-20T00:05:49Z"},{"alias_kind":"pith_short_12","alias_value":"NIAGMWQYSJDP","created_at":"2026-05-20T00:05:49Z"},{"alias_kind":"pith_short_16","alias_value":"NIAGMWQYSJDPWAI6","created_at":"2026-05-20T00:05:49Z"},{"alias_kind":"pith_short_8","alias_value":"NIAGMWQY","created_at":"2026-05-20T00:05:49Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:NIAGMWQYSJDPWAI6JEYSJJCF64","target":"record","payload":{"canonical_record":{"source":{"id":"2605.18185","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.MA","submitted_at":"2026-05-18T10:26:50Z","cross_cats_sorted":[],"title_canon_sha256":"ddde89a0bf3f87a749edc800cb6aef0f0d47a7724ad7cb4d2a2d33e095d862f1","abstract_canon_sha256":"64d8dd4256561d73340d01650c7e50bea2d3d16a92a558c245426d38f858fc5a"},"schema_version":"1.0"},"canonical_sha256":"6a00665a189246fb011e493124a445f7288ce42dcccc4a1ec0bef51b5da41ee2","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:05:49.763666Z","signature_b64":"hrByDo1OIqXm1sqgDsaM87b6o1GE4CBmThP3tXID7oVMjqeJEKMDaR9gVrcLeGvF0ernELOhBEvhFEnkxSaJCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6a00665a189246fb011e493124a445f7288ce42dcccc4a1ec0bef51b5da41ee2","last_reissued_at":"2026-05-20T00:05:49.763054Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:05:49.763054Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.18185","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:05:49Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"QDw5lrB/2J+OwFaB7PE707aKCE2a2DAnw5Hwt/QDx1nOyYajBaTk889oPfjpblqnU1uCNWYERPGdBcBmyh3IAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T20:16:46.076708Z"},"content_sha256":"5637a1d97f6efc4c3a97b2327596fbaf618bf395881bf628c1cb2a9f4855c787","schema_version":"1.0","event_id":"sha256:5637a1d97f6efc4c3a97b2327596fbaf618bf395881bf628c1cb2a9f4855c787"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:NIAGMWQYSJDPWAI6JEYSJJCF64","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"The Dynamics of Policy Gradient in Social Dilemmas with Partner Selection","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.MA","authors_text":"Benedict Russell, Chin-wing Leung, Paolo Turrini","submitted_at":"2026-05-18T10:26:50Z","abstract_excerpt":"In social dilemmas self-interested learning agents face the choice between the societal benefit of cooperation and the immediate reward of defection. Significant evidence exists on the benefits of assortment mechanisms such as partner selection for the emergence of cooperation, but this is largely available through agent-based simulations. In this paper, we provide an analytical solution to the problem, studying the policy-gradient dynamics in a multi-agent environment with partner selection. We show how partner selection changes the opponent distribution and hence the reward landscape, and pr"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18185","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.18185/integrity.json","findings":[],"available":true,"detectors_run":[{"name":"claim_evidence","ran_at":"2026-05-19T23:41:59.020661Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"ai_meta_artifact","ran_at":"2026-05-19T23:33:35.338585Z","status":"skipped","version":"1.0.0","findings_count":0}],"snapshot_sha256":"ff51fd67fdef37cbf31341eaa2d23e8164384601b6b5400129ba9a4a4d69bf24"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:05:49Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"uNSRoLnavJb1Q+9xB3d62OBgsQkmsd8gPmoaiUAWwg+yGsYSLaOySZIgnDnOEyyIdsLDsfcE7/KLOfcy63gEDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T20:16:46.077515Z"},"content_sha256":"2d2df6ad80e1fb8deb53bdeb443609d7b49f273584693e4cfa64b072325d385c","schema_version":"1.0","event_id":"sha256:2d2df6ad80e1fb8deb53bdeb443609d7b49f273584693e4cfa64b072325d385c"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/NIAGMWQYSJDPWAI6JEYSJJCF64/bundle.json","state_url":"https://pith.science/pith/NIAGMWQYSJDPWAI6JEYSJJCF64/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/NIAGMWQYSJDPWAI6JEYSJJCF64/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-06T20:16:46Z","links":{"resolver":"https://pith.science/pith/NIAGMWQYSJDPWAI6JEYSJJCF64","bundle":"https://pith.science/pith/NIAGMWQYSJDPWAI6JEYSJJCF64/bundle.json","state":"https://pith.science/pith/NIAGMWQYSJDPWAI6JEYSJJCF64/state.json","well_known_bundle":"https://pith.science/.well-known/pith/NIAGMWQYSJDPWAI6JEYSJJCF64/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:NIAGMWQYSJDPWAI6JEYSJJCF64","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"64d8dd4256561d73340d01650c7e50bea2d3d16a92a558c245426d38f858fc5a","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.MA","submitted_at":"2026-05-18T10:26:50Z","title_canon_sha256":"ddde89a0bf3f87a749edc800cb6aef0f0d47a7724ad7cb4d2a2d33e095d862f1"},"schema_version":"1.0","source":{"id":"2605.18185","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.18185","created_at":"2026-05-20T00:05:49Z"},{"alias_kind":"arxiv_version","alias_value":"2605.18185v1","created_at":"2026-05-20T00:05:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18185","created_at":"2026-05-20T00:05:49Z"},{"alias_kind":"pith_short_12","alias_value":"NIAGMWQYSJDP","created_at":"2026-05-20T00:05:49Z"},{"alias_kind":"pith_short_16","alias_value":"NIAGMWQYSJDPWAI6","created_at":"2026-05-20T00:05:49Z"},{"alias_kind":"pith_short_8","alias_value":"NIAGMWQY","created_at":"2026-05-20T00:05:49Z"}],"graph_snapshots":[{"event_id":"sha256:2d2df6ad80e1fb8deb53bdeb443609d7b49f273584693e4cfa64b072325d385c","target":"graph","created_at":"2026-05-20T00:05:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"claim_evidence","ran_at":"2026-05-19T23:41:59.020661Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"ai_meta_artifact","ran_at":"2026-05-19T23:33:35.338585Z","status":"skipped","version":"1.0.0"}],"endpoint":"/pith/2605.18185/integrity.json","findings":[],"snapshot_sha256":"ff51fd67fdef37cbf31341eaa2d23e8164384601b6b5400129ba9a4a4d69bf24","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"In social dilemmas self-interested learning agents face the choice between the societal benefit of cooperation and the immediate reward of defection. Significant evidence exists on the benefits of assortment mechanisms such as partner selection for the emergence of cooperation, but this is largely available through agent-based simulations. In this paper, we provide an analytical solution to the problem, studying the policy-gradient dynamics in a multi-agent environment with partner selection. We show how partner selection changes the opponent distribution and hence the reward landscape, and pr","authors_text":"Benedict Russell, Chin-wing Leung, Paolo Turrini","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.MA","submitted_at":"2026-05-18T10:26:50Z","title":"The Dynamics of Policy Gradient in Social Dilemmas with Partner Selection"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18185","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5637a1d97f6efc4c3a97b2327596fbaf618bf395881bf628c1cb2a9f4855c787","target":"record","created_at":"2026-05-20T00:05:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"64d8dd4256561d73340d01650c7e50bea2d3d16a92a558c245426d38f858fc5a","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.MA","submitted_at":"2026-05-18T10:26:50Z","title_canon_sha256":"ddde89a0bf3f87a749edc800cb6aef0f0d47a7724ad7cb4d2a2d33e095d862f1"},"schema_version":"1.0","source":{"id":"2605.18185","kind":"arxiv","version":1}},"canonical_sha256":"6a00665a189246fb011e493124a445f7288ce42dcccc4a1ec0bef51b5da41ee2","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"6a00665a189246fb011e493124a445f7288ce42dcccc4a1ec0bef51b5da41ee2","first_computed_at":"2026-05-20T00:05:49.763054Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:05:49.763054Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"hrByDo1OIqXm1sqgDsaM87b6o1GE4CBmThP3tXID7oVMjqeJEKMDaR9gVrcLeGvF0ernELOhBEvhFEnkxSaJCg==","signature_status":"signed_v1","signed_at":"2026-05-20T00:05:49.763666Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.18185","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5637a1d97f6efc4c3a97b2327596fbaf618bf395881bf628c1cb2a9f4855c787","sha256:2d2df6ad80e1fb8deb53bdeb443609d7b49f273584693e4cfa64b072325d385c"],"state_sha256":"4114aef5530528f48432a2b311853e2addd6b1f7a7fe3f31d7cbf29434fb8f52"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"siD1FJw43QVdki4v+ZN0wW1EC0ClbGHuXFAw5i2pp6zZw4SjlWNMKjI+bmf97gjwZpokJTUiY8ObUSxHbX70Bw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-06T20:16:46.081346Z","bundle_sha256":"06e6d9b1ecebd16bd8974811ae8c04c2a27c4b0e086e3e144db8370b231e5bae"}}