{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:2DHGSTSVYIU6RI43U2N2P22NPO","short_pith_number":"pith:2DHGSTSV","canonical_record":{"source":{"id":"1904.01806","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-04-03T07:15:46Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"a9eebc45772dfca5c74b11ab1dd0899e79faf4a4e556a97a23696769ea63b21d","abstract_canon_sha256":"d8adeef1432bef0c4fff3a3fd566286328d21194f5998dac62ee015408127a2c"},"schema_version":"1.0"},"canonical_sha256":"d0ce694e55c229e8a39ba69ba7eb4d7bbc14ac4eee7c4ea0977d528f45365e0d","source":{"kind":"arxiv","id":"1904.01806","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1904.01806","created_at":"2026-05-17T23:49:29Z"},{"alias_kind":"arxiv_version","alias_value":"1904.01806v1","created_at":"2026-05-17T23:49:29Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1904.01806","created_at":"2026-05-17T23:49:29Z"},{"alias_kind":"pith_short_12","alias_value":"2DHGSTSVYIU6","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_16","alias_value":"2DHGSTSVYIU6RI43","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_8","alias_value":"2DHGSTSV","created_at":"2026-05-18T12:33:07Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:2DHGSTSVYIU6RI43U2N2P22NPO","target":"record","payload":{"canonical_record":{"source":{"id":"1904.01806","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-04-03T07:15:46Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"a9eebc45772dfca5c74b11ab1dd0899e79faf4a4e556a97a23696769ea63b21d","abstract_canon_sha256":"d8adeef1432bef0c4fff3a3fd566286328d21194f5998dac62ee015408127a2c"},"schema_version":"1.0"},"canonical_sha256":"d0ce694e55c229e8a39ba69ba7eb4d7bbc14ac4eee7c4ea0977d528f45365e0d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:49:29.614715Z","signature_b64":"VWJn58OzklCwH4ATamxv2wlFgTdfOjrszeW1yvUTp9a4Xh+yWQbrDM8K21lmlmIgM4ewz4fZNU/PdPqqrX4lCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"d0ce694e55c229e8a39ba69ba7eb4d7bbc14ac4eee7c4ea0977d528f45365e0d","last_reissued_at":"2026-05-17T23:49:29.614074Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:49:29.614074Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1904.01806","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:49:29Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"4cD6TJ2qACHpQWCLNR50MzwsY3Gi+eqBWjN9rYE5zxV6X29YQR8XbwEvyn+qSSho9wxFZTyF+GTTEK4RIiayBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T21:33:55.682884Z"},"content_sha256":"dfde355d9aa37607ebfdcdd8e7a7f45505fc402464389010f7090c5a4a60ea62","schema_version":"1.0","event_id":"sha256:dfde355d9aa37607ebfdcdd8e7a7f45505fc402464389010f7090c5a4a60ea62"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:2DHGSTSVYIU6RI43U2N2P22NPO","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Deep Reinforcement Learning on a Budget: 3D Control and Reasoning Without a Supercomputer","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"Christian Wolf, Edward Beeching, Jilles Dibangoye, Olivier Simonin","submitted_at":"2019-04-03T07:15:46Z","abstract_excerpt":"An important goal of research in Deep Reinforcement Learning in mobile robotics is to train agents capable of solving complex tasks, which require a high level of scene understanding and reasoning from an egocentric perspective. When trained from simulations, optimal environments should satisfy a currently unobtainable combination of high-fidelity photographic observations, massive amounts of different environment configurations and fast simulation speeds. In this paper we argue that research on training agents capable of complex reasoning can be simplified by decoupling from the requirement o"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1904.01806","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:49:29Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1ZvZeon8/pGUTOPGixbIpmNNvT/IqaNKM/VWeXFHSRjnund7Ae7pXsiT4vJqqt9KRFz15tvk4zeoXlfuO68BBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T21:33:55.683248Z"},"content_sha256":"63cf02cbb688a4546dedc500fcafea3bf4107efc1563afb07c0f4fc8773151d5","schema_version":"1.0","event_id":"sha256:63cf02cbb688a4546dedc500fcafea3bf4107efc1563afb07c0f4fc8773151d5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/2DHGSTSVYIU6RI43U2N2P22NPO/bundle.json","state_url":"https://pith.science/pith/2DHGSTSVYIU6RI43U2N2P22NPO/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/2DHGSTSVYIU6RI43U2N2P22NPO/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T21:33:55Z","links":{"resolver":"https://pith.science/pith/2DHGSTSVYIU6RI43U2N2P22NPO","bundle":"https://pith.science/pith/2DHGSTSVYIU6RI43U2N2P22NPO/bundle.json","state":"https://pith.science/pith/2DHGSTSVYIU6RI43U2N2P22NPO/state.json","well_known_bundle":"https://pith.science/.well-known/pith/2DHGSTSVYIU6RI43U2N2P22NPO/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:2DHGSTSVYIU6RI43U2N2P22NPO","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d8adeef1432bef0c4fff3a3fd566286328d21194f5998dac62ee015408127a2c","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-04-03T07:15:46Z","title_canon_sha256":"a9eebc45772dfca5c74b11ab1dd0899e79faf4a4e556a97a23696769ea63b21d"},"schema_version":"1.0","source":{"id":"1904.01806","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1904.01806","created_at":"2026-05-17T23:49:29Z"},{"alias_kind":"arxiv_version","alias_value":"1904.01806v1","created_at":"2026-05-17T23:49:29Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1904.01806","created_at":"2026-05-17T23:49:29Z"},{"alias_kind":"pith_short_12","alias_value":"2DHGSTSVYIU6","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_16","alias_value":"2DHGSTSVYIU6RI43","created_at":"2026-05-18T12:33:07Z"},{"alias_kind":"pith_short_8","alias_value":"2DHGSTSV","created_at":"2026-05-18T12:33:07Z"}],"graph_snapshots":[{"event_id":"sha256:63cf02cbb688a4546dedc500fcafea3bf4107efc1563afb07c0f4fc8773151d5","target":"graph","created_at":"2026-05-17T23:49:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"An important goal of research in Deep Reinforcement Learning in mobile robotics is to train agents capable of solving complex tasks, which require a high level of scene understanding and reasoning from an egocentric perspective. When trained from simulations, optimal environments should satisfy a currently unobtainable combination of high-fidelity photographic observations, massive amounts of different environment configurations and fast simulation speeds. In this paper we argue that research on training agents capable of complex reasoning can be simplified by decoupling from the requirement o","authors_text":"Christian Wolf, Edward Beeching, Jilles Dibangoye, Olivier Simonin","cross_cats":["stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-04-03T07:15:46Z","title":"Deep Reinforcement Learning on a Budget: 3D Control and Reasoning Without a Supercomputer"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1904.01806","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:dfde355d9aa37607ebfdcdd8e7a7f45505fc402464389010f7090c5a4a60ea62","target":"record","created_at":"2026-05-17T23:49:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d8adeef1432bef0c4fff3a3fd566286328d21194f5998dac62ee015408127a2c","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2019-04-03T07:15:46Z","title_canon_sha256":"a9eebc45772dfca5c74b11ab1dd0899e79faf4a4e556a97a23696769ea63b21d"},"schema_version":"1.0","source":{"id":"1904.01806","kind":"arxiv","version":1}},"canonical_sha256":"d0ce694e55c229e8a39ba69ba7eb4d7bbc14ac4eee7c4ea0977d528f45365e0d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d0ce694e55c229e8a39ba69ba7eb4d7bbc14ac4eee7c4ea0977d528f45365e0d","first_computed_at":"2026-05-17T23:49:29.614074Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:49:29.614074Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"VWJn58OzklCwH4ATamxv2wlFgTdfOjrszeW1yvUTp9a4Xh+yWQbrDM8K21lmlmIgM4ewz4fZNU/PdPqqrX4lCQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:49:29.614715Z","signed_message":"canonical_sha256_bytes"},"source_id":"1904.01806","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:dfde355d9aa37607ebfdcdd8e7a7f45505fc402464389010f7090c5a4a60ea62","sha256:63cf02cbb688a4546dedc500fcafea3bf4107efc1563afb07c0f4fc8773151d5"],"state_sha256":"98ac3c3a0dabd6f710bbeb648f3b43211f7103e4c941e188c5f3011b928e80ed"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"mh0BgAw0k3xjCKcpcW3gaAAwix5heoR5lpqHHns5b3SDWbXgOoDVQfmM3cokYf/XYsuLfG98A0FmUgpmsR1lAQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T21:33:55.685456Z","bundle_sha256":"19bd88a9b71b3aee5a035bc0b0e7648b61259665c5b930e27f972c52ab3f7c73"}}