{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:FNIT7S4BFV3NCVHLSCH54SPK2M","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"f05d71bc8bd1c7ca9f458a951011cea618d51825d6e9cb322075d686f1a0c1da","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2019-04-14T18:18:45Z","title_canon_sha256":"2b2b61b4356a913f180b449e52a57edf1e1a7936291bf48d3d380e4a2b3c0af7"},"schema_version":"1.0","source":{"id":"1904.06736","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1904.06736","created_at":"2026-05-17T23:48:29Z"},{"alias_kind":"arxiv_version","alias_value":"1904.06736v1","created_at":"2026-05-17T23:48:29Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1904.06736","created_at":"2026-05-17T23:48:29Z"},{"alias_kind":"pith_short_12","alias_value":"FNIT7S4BFV3N","created_at":"2026-05-18T12:33:15Z"},{"alias_kind":"pith_short_16","alias_value":"FNIT7S4BFV3NCVHL","created_at":"2026-05-18T12:33:15Z"},{"alias_kind":"pith_short_8","alias_value":"FNIT7S4B","created_at":"2026-05-18T12:33:15Z"}],"graph_snapshots":[{"event_id":"sha256:6d04837b2932757d211fb8990407b0d6aeec774271ed164cb76d30384b2c993b","target":"graph","created_at":"2026-05-17T23:48:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Reinforcement learning (RL) is a branch of machine learning which is employed to solve various sequential decision making problems without proper supervision. Due to the recent advancement of deep learning, the newly proposed Deep-RL algorithms have been able to perform extremely well in sophisticated high-dimensional environments. However, even after successes in many domains, one of the major challenge in these approaches is the high magnitude of interactions with the environment required for efficient decision making. Seeking inspiration from the brain, this problem can be solved by incorpo","authors_text":"Dhruv Ramani","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2019-04-14T18:18:45Z","title":"A Short Survey On Memory Based Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1904.06736","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3065a7a4ba7223b00fcbb8d0b763999786fae11969d655ddf02bc03361353dca","target":"record","created_at":"2026-05-17T23:48:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"f05d71bc8bd1c7ca9f458a951011cea618d51825d6e9cb322075d686f1a0c1da","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2019-04-14T18:18:45Z","title_canon_sha256":"2b2b61b4356a913f180b449e52a57edf1e1a7936291bf48d3d380e4a2b3c0af7"},"schema_version":"1.0","source":{"id":"1904.06736","kind":"arxiv","version":1}},"canonical_sha256":"2b513fcb812d76d154eb908fde49ead33218f1ecc149cb43d5887389cd853cf9","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"2b513fcb812d76d154eb908fde49ead33218f1ecc149cb43d5887389cd853cf9","first_computed_at":"2026-05-17T23:48:29.277432Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:48:29.277432Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"dIyYVCPBqBbtSBQ4H4tcmdir8WtQFzkaFBgKfeeKRdZh1/iINpsv/c2xvJQFWU4myGegdxDPNnJsK0HjbNUfCw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:48:29.278076Z","signed_message":"canonical_sha256_bytes"},"source_id":"1904.06736","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3065a7a4ba7223b00fcbb8d0b763999786fae11969d655ddf02bc03361353dca","sha256:6d04837b2932757d211fb8990407b0d6aeec774271ed164cb76d30384b2c993b"],"state_sha256":"b57b5a1fbe10f3779e9c9d56c6831a235e39d1881c138c4893d87204170cdbc5"}