{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:V5D3YYHLRXEI3JURQPZTKSERIT","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"10a3449a35287798e9793c6b3b3cd3c65d2fa927c3c34a5ed7ce48c59177abff","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2025-06-11T19:36:17Z","title_canon_sha256":"eace06213e7ecc84cce3797602321a3d5158715e2e33954edb12cb0a29747ebe"},"schema_version":"1.0","source":{"id":"2506.10138","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2506.10138","created_at":"2026-05-28T01:04:07Z"},{"alias_kind":"arxiv_version","alias_value":"2506.10138v3","created_at":"2026-05-28T01:04:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2506.10138","created_at":"2026-05-28T01:04:07Z"},{"alias_kind":"pith_short_12","alias_value":"V5D3YYHLRXEI","created_at":"2026-05-28T01:04:07Z"},{"alias_kind":"pith_short_16","alias_value":"V5D3YYHLRXEI3JUR","created_at":"2026-05-28T01:04:07Z"},{"alias_kind":"pith_short_8","alias_value":"V5D3YYHL","created_at":"2026-05-28T01:04:07Z"}],"graph_snapshots":[{"event_id":"sha256:391f5af03cbbe7475fcd377882fb3f820ffb585741c0a60074cbcfdb0a7266aa","target":"graph","created_at":"2026-05-28T01:04:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2506.10138/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"We partially reverse-engineer a convolutional recurrent neural network (RNN) trained with model-free reinforcement learning to play the box-pushing game Sokoban. We find that the RNN stores future moves (plans) as activations in particular channels of the hidden state, which we call path channels. A high activation in a particular location means that, when a box is in that location, it will get pushed in the channel's assigned direction. We examine the convolutional kernels between path channels and find that they encode the change in position resulting from each possible action, thus represen","authors_text":"Aaron David Tucker, Adam Gleave, Adri\\`a Garriga-Alonso, Mohammad Taufeeque","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2025-06-11T19:36:17Z","title":"Path Channels and Plan Extension Kernels: a Mechanistic Description of Planning in a Sokoban RNN"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2506.10138","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:257f5262037d1626ff0978fe2d8dc71d8bce0ce091ff46f28ef490ca813f0ab1","target":"record","created_at":"2026-05-28T01:04:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"10a3449a35287798e9793c6b3b3cd3c65d2fa927c3c34a5ed7ce48c59177abff","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2025-06-11T19:36:17Z","title_canon_sha256":"eace06213e7ecc84cce3797602321a3d5158715e2e33954edb12cb0a29747ebe"},"schema_version":"1.0","source":{"id":"2506.10138","kind":"arxiv","version":3}},"canonical_sha256":"af47bc60eb8dc88da69183f335489144edebaacc6a2c37a2db6962a2a2f6f5fb","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"af47bc60eb8dc88da69183f335489144edebaacc6a2c37a2db6962a2a2f6f5fb","first_computed_at":"2026-05-28T01:04:07.292886Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-28T01:04:07.292886Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"i9Wbgwj0l29QuGxUKY9hTTh5xAo9k+fFdt6ARVL1T58IGWmInAmufIur6wNctW5Rgz3WnTLTn1kPzVkE+mN6Bw==","signature_status":"signed_v1","signed_at":"2026-05-28T01:04:07.293834Z","signed_message":"canonical_sha256_bytes"},"source_id":"2506.10138","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:257f5262037d1626ff0978fe2d8dc71d8bce0ce091ff46f28ef490ca813f0ab1","sha256:391f5af03cbbe7475fcd377882fb3f820ffb585741c0a60074cbcfdb0a7266aa"],"state_sha256":"cf23285dd6ffe7817a4fa1f5860280e289c7e7c99b4e458af3075478fa10b31d"}