{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2017:O4CGJ6QRY3JCRFGULHCDFBXSCY","short_pith_number":"pith:O4CGJ6QR","schema_version":"1.0","canonical_sha256":"770464fa11c6d22894d459c43286f216345e51725490cd1e389adcdb0166f88f","source":{"kind":"arxiv","id":"1711.11165","version":1},"attestation_state":"computed","paper":{"title":"Safe Exploration for Identifying Linear Systems via Robust Optimization","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.SY"],"primary_cat":"cs.LG","authors_text":"Binz Roy, Craig Boutilier, Dale Schuurmans, Martin Zinkevich, Tyler Lu","submitted_at":"2017-11-30T00:13:28Z","abstract_excerpt":"Safely exploring an unknown dynamical system is critical to the deployment of reinforcement learning (RL) in physical systems where failures may have catastrophic consequences. In scenarios where one knows little about the dynamics, diverse transition data covering relevant regions of state-action space is needed to apply either model-based or model-free RL. Motivated by the cooling of Google's data centers, we study how one can safely identify the parameters of a system model with a desired accuracy and confidence level. In particular, we focus on learning an unknown linear system with Gaussi"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1711.11165","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-30T00:13:28Z","cross_cats_sorted":["cs.SY"],"title_canon_sha256":"4001e7290aee5cf3bd4ab9ea46c61dd89b8055db58f51de3eb733a75a43ae12f","abstract_canon_sha256":"d33495eef961d49eb4fe09cfe47f3fca7dddeb6bdeea8e986d936670da0dbce4"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:29:12.293232Z","signature_b64":"MgGXfnliVnSfd7ln9nbMZwCDO3Ani4duG9pZYXPqDCybN7rbA8Bj9fCKdHLCbSfyX+Yqvz/zod+Llsu5tQPADg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"770464fa11c6d22894d459c43286f216345e51725490cd1e389adcdb0166f88f","last_reissued_at":"2026-05-18T00:29:12.292695Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:29:12.292695Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Safe Exploration for Identifying Linear Systems via Robust Optimization","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.SY"],"primary_cat":"cs.LG","authors_text":"Binz Roy, Craig Boutilier, Dale Schuurmans, Martin Zinkevich, Tyler Lu","submitted_at":"2017-11-30T00:13:28Z","abstract_excerpt":"Safely exploring an unknown dynamical system is critical to the deployment of reinforcement learning (RL) in physical systems where failures may have catastrophic consequences. In scenarios where one knows little about the dynamics, diverse transition data covering relevant regions of state-action space is needed to apply either model-based or model-free RL. Motivated by the cooling of Google's data centers, we study how one can safely identify the parameters of a system model with a desired accuracy and confidence level. In particular, we focus on learning an unknown linear system with Gaussi"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1711.11165","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1711.11165","created_at":"2026-05-18T00:29:12.292781+00:00"},{"alias_kind":"arxiv_version","alias_value":"1711.11165v1","created_at":"2026-05-18T00:29:12.292781+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1711.11165","created_at":"2026-05-18T00:29:12.292781+00:00"},{"alias_kind":"pith_short_12","alias_value":"O4CGJ6QRY3JC","created_at":"2026-05-18T12:31:34.259226+00:00"},{"alias_kind":"pith_short_16","alias_value":"O4CGJ6QRY3JCRFGU","created_at":"2026-05-18T12:31:34.259226+00:00"},{"alias_kind":"pith_short_8","alias_value":"O4CGJ6QR","created_at":"2026-05-18T12:31:34.259226+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/O4CGJ6QRY3JCRFGULHCDFBXSCY","json":"https://pith.science/pith/O4CGJ6QRY3JCRFGULHCDFBXSCY.json","graph_json":"https://pith.science/api/pith-number/O4CGJ6QRY3JCRFGULHCDFBXSCY/graph.json","events_json":"https://pith.science/api/pith-number/O4CGJ6QRY3JCRFGULHCDFBXSCY/events.json","paper":"https://pith.science/paper/O4CGJ6QR"},"agent_actions":{"view_html":"https://pith.science/pith/O4CGJ6QRY3JCRFGULHCDFBXSCY","download_json":"https://pith.science/pith/O4CGJ6QRY3JCRFGULHCDFBXSCY.json","view_paper":"https://pith.science/paper/O4CGJ6QR","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1711.11165&json=true","fetch_graph":"https://pith.science/api/pith-number/O4CGJ6QRY3JCRFGULHCDFBXSCY/graph.json","fetch_events":"https://pith.science/api/pith-number/O4CGJ6QRY3JCRFGULHCDFBXSCY/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/O4CGJ6QRY3JCRFGULHCDFBXSCY/action/timestamp_anchor","attest_storage":"https://pith.science/pith/O4CGJ6QRY3JCRFGULHCDFBXSCY/action/storage_attestation","attest_author":"https://pith.science/pith/O4CGJ6QRY3JCRFGULHCDFBXSCY/action/author_attestation","sign_citation":"https://pith.science/pith/O4CGJ6QRY3JCRFGULHCDFBXSCY/action/citation_signature","submit_replication":"https://pith.science/pith/O4CGJ6QRY3JCRFGULHCDFBXSCY/action/replication_record"}},"created_at":"2026-05-18T00:29:12.292781+00:00","updated_at":"2026-05-18T00:29:12.292781+00:00"}