{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:L7QIIC5KICB6OGZ56DXOGVYLB5","short_pith_number":"pith:L7QIIC5K","canonical_record":{"source":{"id":"1606.04460","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-06-14T17:03:46Z","cross_cats_sorted":["cs.LG","q-bio.NC"],"title_canon_sha256":"e9a8b8b5c1a0bc6c261e5ed19d5fc66f6cab73c2bb5efab6c401b20ed8fa3ecc","abstract_canon_sha256":"0fbbdb02e1b005ee8df66fc50e3410ba4c97ccde4b2cd32cb575a0187bd37066"},"schema_version":"1.0"},"canonical_sha256":"5fe0840baa4083e71b3df0eee3570b0f696a2731bec51ba3cc5f6986e4c3a057","source":{"kind":"arxiv","id":"1606.04460","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1606.04460","created_at":"2026-05-18T01:12:25Z"},{"alias_kind":"arxiv_version","alias_value":"1606.04460v1","created_at":"2026-05-18T01:12:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1606.04460","created_at":"2026-05-18T01:12:25Z"},{"alias_kind":"pith_short_12","alias_value":"L7QIIC5KICB6","created_at":"2026-05-18T12:30:29Z"},{"alias_kind":"pith_short_16","alias_value":"L7QIIC5KICB6OGZ5","created_at":"2026-05-18T12:30:29Z"},{"alias_kind":"pith_short_8","alias_value":"L7QIIC5K","created_at":"2026-05-18T12:30:29Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:L7QIIC5KICB6OGZ56DXOGVYLB5","target":"record","payload":{"canonical_record":{"source":{"id":"1606.04460","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-06-14T17:03:46Z","cross_cats_sorted":["cs.LG","q-bio.NC"],"title_canon_sha256":"e9a8b8b5c1a0bc6c261e5ed19d5fc66f6cab73c2bb5efab6c401b20ed8fa3ecc","abstract_canon_sha256":"0fbbdb02e1b005ee8df66fc50e3410ba4c97ccde4b2cd32cb575a0187bd37066"},"schema_version":"1.0"},"canonical_sha256":"5fe0840baa4083e71b3df0eee3570b0f696a2731bec51ba3cc5f6986e4c3a057","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:12:25.585420Z","signature_b64":"zKhVdsdL87EuLOOFc4sUzdVbsQJ0D6PVhmxRHIEQJ7VhbBO/YI4v8Iew43Rg6kGhyoCVMCY6MdYlzCjlQJDNBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5fe0840baa4083e71b3df0eee3570b0f696a2731bec51ba3cc5f6986e4c3a057","last_reissued_at":"2026-05-18T01:12:25.585059Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:12:25.585059Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1606.04460","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:12:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/NQq/kgSfqfmmgV1buz0SVI8u132o92Z6/IQAm8aa1phy58q9BX+M54MU2cdDpWaJf4sl1JvUKuL4PFHdfSnCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T14:30:33.113458Z"},"content_sha256":"956eb378f301278556eb03e7253a5f98f8c7b730cc09dcc1095b6065461fd964","schema_version":"1.0","event_id":"sha256:956eb378f301278556eb03e7253a5f98f8c7b730cc09dcc1095b6065461fd964"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:L7QIIC5KICB6OGZ56DXOGVYLB5","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Model-Free Episodic Control","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","q-bio.NC"],"primary_cat":"stat.ML","authors_text":"Alexander Pritzel, Avraham Ruderman, Benigno Uria, Charles Blundell, Daan Wierstra, Demis Hassabis, Jack Rae, Joel Z Leibo, Yazhe Li","submitted_at":"2016-06-14T17:03:46Z","abstract_excerpt":"State of the art deep reinforcement learning algorithms take many millions of interactions to attain human-level performance. Humans, on the other hand, can very quickly exploit highly rewarding nuances of an environment upon first discovery. In the brain, such rapid learning is thought to depend on the hippocampus and its capacity for episodic memory. Here we investigate whether a simple model of hippocampal episodic control can learn to solve difficult sequential decision-making tasks. We demonstrate that it not only attains a highly rewarding strategy significantly faster than state-of-the-"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1606.04460","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:12:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"shzgaqW4vbXLnwRCnscTi0c3rCeKDksKeoM611WSA2P6BM/ggPLyREJUR1E0Z13NZcrTdQPZezD+EJYhExEbDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T14:30:33.113796Z"},"content_sha256":"2ae60983c834da271831e05bb0825267ffc04b8593662ef5dcf3d91b3cabc43e","schema_version":"1.0","event_id":"sha256:2ae60983c834da271831e05bb0825267ffc04b8593662ef5dcf3d91b3cabc43e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/L7QIIC5KICB6OGZ56DXOGVYLB5/bundle.json","state_url":"https://pith.science/pith/L7QIIC5KICB6OGZ56DXOGVYLB5/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/L7QIIC5KICB6OGZ56DXOGVYLB5/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-30T14:30:33Z","links":{"resolver":"https://pith.science/pith/L7QIIC5KICB6OGZ56DXOGVYLB5","bundle":"https://pith.science/pith/L7QIIC5KICB6OGZ56DXOGVYLB5/bundle.json","state":"https://pith.science/pith/L7QIIC5KICB6OGZ56DXOGVYLB5/state.json","well_known_bundle":"https://pith.science/.well-known/pith/L7QIIC5KICB6OGZ56DXOGVYLB5/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:L7QIIC5KICB6OGZ56DXOGVYLB5","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0fbbdb02e1b005ee8df66fc50e3410ba4c97ccde4b2cd32cb575a0187bd37066","cross_cats_sorted":["cs.LG","q-bio.NC"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-06-14T17:03:46Z","title_canon_sha256":"e9a8b8b5c1a0bc6c261e5ed19d5fc66f6cab73c2bb5efab6c401b20ed8fa3ecc"},"schema_version":"1.0","source":{"id":"1606.04460","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1606.04460","created_at":"2026-05-18T01:12:25Z"},{"alias_kind":"arxiv_version","alias_value":"1606.04460v1","created_at":"2026-05-18T01:12:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1606.04460","created_at":"2026-05-18T01:12:25Z"},{"alias_kind":"pith_short_12","alias_value":"L7QIIC5KICB6","created_at":"2026-05-18T12:30:29Z"},{"alias_kind":"pith_short_16","alias_value":"L7QIIC5KICB6OGZ5","created_at":"2026-05-18T12:30:29Z"},{"alias_kind":"pith_short_8","alias_value":"L7QIIC5K","created_at":"2026-05-18T12:30:29Z"}],"graph_snapshots":[{"event_id":"sha256:2ae60983c834da271831e05bb0825267ffc04b8593662ef5dcf3d91b3cabc43e","target":"graph","created_at":"2026-05-18T01:12:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"State of the art deep reinforcement learning algorithms take many millions of interactions to attain human-level performance. Humans, on the other hand, can very quickly exploit highly rewarding nuances of an environment upon first discovery. In the brain, such rapid learning is thought to depend on the hippocampus and its capacity for episodic memory. Here we investigate whether a simple model of hippocampal episodic control can learn to solve difficult sequential decision-making tasks. We demonstrate that it not only attains a highly rewarding strategy significantly faster than state-of-the-","authors_text":"Alexander Pritzel, Avraham Ruderman, Benigno Uria, Charles Blundell, Daan Wierstra, Demis Hassabis, Jack Rae, Joel Z Leibo, Yazhe Li","cross_cats":["cs.LG","q-bio.NC"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-06-14T17:03:46Z","title":"Model-Free Episodic Control"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1606.04460","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:956eb378f301278556eb03e7253a5f98f8c7b730cc09dcc1095b6065461fd964","target":"record","created_at":"2026-05-18T01:12:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0fbbdb02e1b005ee8df66fc50e3410ba4c97ccde4b2cd32cb575a0187bd37066","cross_cats_sorted":["cs.LG","q-bio.NC"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-06-14T17:03:46Z","title_canon_sha256":"e9a8b8b5c1a0bc6c261e5ed19d5fc66f6cab73c2bb5efab6c401b20ed8fa3ecc"},"schema_version":"1.0","source":{"id":"1606.04460","kind":"arxiv","version":1}},"canonical_sha256":"5fe0840baa4083e71b3df0eee3570b0f696a2731bec51ba3cc5f6986e4c3a057","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5fe0840baa4083e71b3df0eee3570b0f696a2731bec51ba3cc5f6986e4c3a057","first_computed_at":"2026-05-18T01:12:25.585059Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:12:25.585059Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"zKhVdsdL87EuLOOFc4sUzdVbsQJ0D6PVhmxRHIEQJ7VhbBO/YI4v8Iew43Rg6kGhyoCVMCY6MdYlzCjlQJDNBg==","signature_status":"signed_v1","signed_at":"2026-05-18T01:12:25.585420Z","signed_message":"canonical_sha256_bytes"},"source_id":"1606.04460","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:956eb378f301278556eb03e7253a5f98f8c7b730cc09dcc1095b6065461fd964","sha256:2ae60983c834da271831e05bb0825267ffc04b8593662ef5dcf3d91b3cabc43e"],"state_sha256":"9e4896bfd869c57981eae3f8e32e0cc43a044b6042d0049151eac2cf3cbcd948"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"WGvIZazWGYTmO5eg07lVYzbz6delindII4r4Pa2l4OxLbLh9y//7QCrqsv9DDBOTRVuMAG6zIRQCbOYq7bDGCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-30T14:30:33.115649Z","bundle_sha256":"e6becbbef9914e2b0b9653824c0734937840a742894e454317153afcc4119b3c"}}