{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:FW3P5GL42MOCZ54XSH7MRVAFFZ","short_pith_number":"pith:FW3P5GL4","canonical_record":{"source":{"id":"1705.07177","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-05-19T20:38:49Z","cross_cats_sorted":[],"title_canon_sha256":"121b4c9d571688c9b8f371bbfbd970c9d21af36b2a9d64ecc2796e6bdae9eb83","abstract_canon_sha256":"3db628a2f9d67e7a89e608da875adcc7cfac1665afacddbffdade88a47e03ea3"},"schema_version":"1.0"},"canonical_sha256":"2db6fe997cd31c2cf79791fec8d4052e565bc2a29990bb68a979ae1e960a22cf","source":{"kind":"arxiv","id":"1705.07177","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1705.07177","created_at":"2026-05-18T00:19:17Z"},{"alias_kind":"arxiv_version","alias_value":"1705.07177v2","created_at":"2026-05-18T00:19:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1705.07177","created_at":"2026-05-18T00:19:17Z"},{"alias_kind":"pith_short_12","alias_value":"FW3P5GL42MOC","created_at":"2026-05-18T12:31:15Z"},{"alias_kind":"pith_short_16","alias_value":"FW3P5GL42MOCZ54X","created_at":"2026-05-18T12:31:15Z"},{"alias_kind":"pith_short_8","alias_value":"FW3P5GL4","created_at":"2026-05-18T12:31:15Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:FW3P5GL42MOCZ54XSH7MRVAFFZ","target":"record","payload":{"canonical_record":{"source":{"id":"1705.07177","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-05-19T20:38:49Z","cross_cats_sorted":[],"title_canon_sha256":"121b4c9d571688c9b8f371bbfbd970c9d21af36b2a9d64ecc2796e6bdae9eb83","abstract_canon_sha256":"3db628a2f9d67e7a89e608da875adcc7cfac1665afacddbffdade88a47e03ea3"},"schema_version":"1.0"},"canonical_sha256":"2db6fe997cd31c2cf79791fec8d4052e565bc2a29990bb68a979ae1e960a22cf","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:19:17.230618Z","signature_b64":"IWV2mW7tBcpuNSMpNti/y4oWZPrydguUoa9k1H1f21cfrQuIgTYXX719nRHBtuf4BC6GCRfPT3sDbq1svb9qBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"2db6fe997cd31c2cf79791fec8d4052e565bc2a29990bb68a979ae1e960a22cf","last_reissued_at":"2026-05-18T00:19:17.230049Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:19:17.230049Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1705.07177","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:19:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"q7s+OjYvrZZonf/PKMVsB5zoJdrxtQ4qqm0EAFvtnxXijkcgIwCX1Atg0XiQSREm7sm3zDVjfJMc0ZEZGe7PBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T23:24:32.640243Z"},"content_sha256":"c8f67f830ad056474d13423c4b0c5fb1c6c603fe36be926be920fa6a3c6f3dbf","schema_version":"1.0","event_id":"sha256:c8f67f830ad056474d13423c4b0c5fb1c6c603fe36be926be920fa6a3c6f3dbf"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:FW3P5GL42MOCZ54XSH7MRVAFFZ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Model-Based Planning with Discrete and Continuous Actions","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Mikael Henaff, William F. Whitney, Yann LeCun","submitted_at":"2017-05-19T20:38:49Z","abstract_excerpt":"Action planning using learned and differentiable forward models of the world is a general approach which has a number of desirable properties, including improved sample complexity over model-free RL methods, reuse of learned models across different tasks, and the ability to perform efficient gradient-based optimization in continuous action spaces. However, this approach does not apply straightforwardly when the action space is discrete. In this work, we show that it is in fact possible to effectively perform planning via backprop in discrete action spaces, using a simple paramaterization of th"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1705.07177","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:19:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"s1XV00mxql3j/pklWyAJKIY1NbryWG3yu6C8TJQtIroxaCmExNZ9KbhdgVd7di3I0viVxLsiFzpLIjSvXo/rAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T23:24:32.640908Z"},"content_sha256":"a6995006554c67f392900d649beffb10ada7408422af7d71de816f7cffaabff5","schema_version":"1.0","event_id":"sha256:a6995006554c67f392900d649beffb10ada7408422af7d71de816f7cffaabff5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/FW3P5GL42MOCZ54XSH7MRVAFFZ/bundle.json","state_url":"https://pith.science/pith/FW3P5GL42MOCZ54XSH7MRVAFFZ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/FW3P5GL42MOCZ54XSH7MRVAFFZ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T23:24:32Z","links":{"resolver":"https://pith.science/pith/FW3P5GL42MOCZ54XSH7MRVAFFZ","bundle":"https://pith.science/pith/FW3P5GL42MOCZ54XSH7MRVAFFZ/bundle.json","state":"https://pith.science/pith/FW3P5GL42MOCZ54XSH7MRVAFFZ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/FW3P5GL42MOCZ54XSH7MRVAFFZ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:FW3P5GL42MOCZ54XSH7MRVAFFZ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"3db628a2f9d67e7a89e608da875adcc7cfac1665afacddbffdade88a47e03ea3","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-05-19T20:38:49Z","title_canon_sha256":"121b4c9d571688c9b8f371bbfbd970c9d21af36b2a9d64ecc2796e6bdae9eb83"},"schema_version":"1.0","source":{"id":"1705.07177","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1705.07177","created_at":"2026-05-18T00:19:17Z"},{"alias_kind":"arxiv_version","alias_value":"1705.07177v2","created_at":"2026-05-18T00:19:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1705.07177","created_at":"2026-05-18T00:19:17Z"},{"alias_kind":"pith_short_12","alias_value":"FW3P5GL42MOC","created_at":"2026-05-18T12:31:15Z"},{"alias_kind":"pith_short_16","alias_value":"FW3P5GL42MOCZ54X","created_at":"2026-05-18T12:31:15Z"},{"alias_kind":"pith_short_8","alias_value":"FW3P5GL4","created_at":"2026-05-18T12:31:15Z"}],"graph_snapshots":[{"event_id":"sha256:a6995006554c67f392900d649beffb10ada7408422af7d71de816f7cffaabff5","target":"graph","created_at":"2026-05-18T00:19:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Action planning using learned and differentiable forward models of the world is a general approach which has a number of desirable properties, including improved sample complexity over model-free RL methods, reuse of learned models across different tasks, and the ability to perform efficient gradient-based optimization in continuous action spaces. However, this approach does not apply straightforwardly when the action space is discrete. In this work, we show that it is in fact possible to effectively perform planning via backprop in discrete action spaces, using a simple paramaterization of th","authors_text":"Mikael Henaff, William F. Whitney, Yann LeCun","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-05-19T20:38:49Z","title":"Model-Based Planning with Discrete and Continuous Actions"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1705.07177","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:c8f67f830ad056474d13423c4b0c5fb1c6c603fe36be926be920fa6a3c6f3dbf","target":"record","created_at":"2026-05-18T00:19:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"3db628a2f9d67e7a89e608da875adcc7cfac1665afacddbffdade88a47e03ea3","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-05-19T20:38:49Z","title_canon_sha256":"121b4c9d571688c9b8f371bbfbd970c9d21af36b2a9d64ecc2796e6bdae9eb83"},"schema_version":"1.0","source":{"id":"1705.07177","kind":"arxiv","version":2}},"canonical_sha256":"2db6fe997cd31c2cf79791fec8d4052e565bc2a29990bb68a979ae1e960a22cf","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"2db6fe997cd31c2cf79791fec8d4052e565bc2a29990bb68a979ae1e960a22cf","first_computed_at":"2026-05-18T00:19:17.230049Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:19:17.230049Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"IWV2mW7tBcpuNSMpNti/y4oWZPrydguUoa9k1H1f21cfrQuIgTYXX719nRHBtuf4BC6GCRfPT3sDbq1svb9qBg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:19:17.230618Z","signed_message":"canonical_sha256_bytes"},"source_id":"1705.07177","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:c8f67f830ad056474d13423c4b0c5fb1c6c603fe36be926be920fa6a3c6f3dbf","sha256:a6995006554c67f392900d649beffb10ada7408422af7d71de816f7cffaabff5"],"state_sha256":"8c168c9d11eda332d912e9bf4812b3683ffebe1f8b8d7d82f32a7655c39c001d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Q67Q2v/l0TsmjYQGRmuZdiH1+IPd720BRr1pb2xSD7GL/LjHURkAuVs915YvBfFaBwncd9QLyO/7phA4s9iEAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T23:24:32.644375Z","bundle_sha256":"9f3c583d8fb8628f60e9fbd53af8fc716fcd49c0cf014159bfbb6b687501a0e8"}}