{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:3GAQO7L74E62YPHLYW3LFBG5AH","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"2d760fccce85bc063055b0ea60079fa9ccb59b2770e00921ff74b8b5db83b522","cross_cats_sorted":["cs.SY","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-08T13:30:48Z","title_canon_sha256":"5929593190946b3abbe1ccddc9f18ee0fa404419e53f2c93a7335d3384504eaf"},"schema_version":"1.0","source":{"id":"1806.03145","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1806.03145","created_at":"2026-05-18T00:13:49Z"},{"alias_kind":"arxiv_version","alias_value":"1806.03145v1","created_at":"2026-05-18T00:13:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1806.03145","created_at":"2026-05-18T00:13:49Z"},{"alias_kind":"pith_short_12","alias_value":"3GAQO7L74E62","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_16","alias_value":"3GAQO7L74E62YPHL","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_8","alias_value":"3GAQO7L7","created_at":"2026-05-18T12:32:02Z"}],"graph_snapshots":[{"event_id":"sha256:34260005c67c9badc6da7fb0c8b6a981e79f7ef753503fa6063d152e826fcd2a","target":"graph","created_at":"2026-05-18T00:13:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The balance between exploration and exploitation is a key problem for reinforcement learning methods, especially for Q-learning. In this paper, a fidelity-based probabilistic Q-learning (FPQL) approach is presented to naturally solve this problem and applied for learning control of quantum systems. In this approach, fidelity is adopted to help direct the learning process and the probability of each action to be selected at a certain state is updated iteratively along with the learning process, which leads to a natural exploration strategy instead of a pointed one with configured parameters. A ","authors_text":"Chunlin Chen, Daoyi Dong, Han-Xiong Li, Jian Chu, Tzyh-Jong Tarn","cross_cats":["cs.SY","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-08T13:30:48Z","title":"Fidelity-based Probabilistic Q-learning for Control of Quantum Systems"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1806.03145","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:cf17669aa080caf5b85307226c38d2e7075edd937b4dc04c30f7bb589d21c4bb","target":"record","created_at":"2026-05-18T00:13:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"2d760fccce85bc063055b0ea60079fa9ccb59b2770e00921ff74b8b5db83b522","cross_cats_sorted":["cs.SY","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-08T13:30:48Z","title_canon_sha256":"5929593190946b3abbe1ccddc9f18ee0fa404419e53f2c93a7335d3384504eaf"},"schema_version":"1.0","source":{"id":"1806.03145","kind":"arxiv","version":1}},"canonical_sha256":"d981077d7fe13dac3cebc5b6b284dd01c04371ce6d0262b13c0fb4a1a49fd2ba","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d981077d7fe13dac3cebc5b6b284dd01c04371ce6d0262b13c0fb4a1a49fd2ba","first_computed_at":"2026-05-18T00:13:49.507843Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:13:49.507843Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"tiZbU6S84S/LWwTmdlNLb3adRM4bzXnrXW4tkis62G75LDeung2oCaHVjn3bXF4Xk90PivY8t5/N3bFb9N9JCg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:13:49.508573Z","signed_message":"canonical_sha256_bytes"},"source_id":"1806.03145","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:cf17669aa080caf5b85307226c38d2e7075edd937b4dc04c30f7bb589d21c4bb","sha256:34260005c67c9badc6da7fb0c8b6a981e79f7ef753503fa6063d152e826fcd2a"],"state_sha256":"e7891a3f0c0f8e496723a01d4dd7198efe00f85dc778f25de9baa0564fa109ab"}