{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:4NJBO4Q42TVQJ5RXDLWNH6RSDT","short_pith_number":"pith:4NJBO4Q4","canonical_record":{"source":{"id":"1704.04866","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-04-17T04:43:05Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"edc074be2dbb97340a7adaf9c71bfce1135642d44e8a8a669569220869bc14b1","abstract_canon_sha256":"3bd2b0a37feb2772cc8b307ea41a0ed67b80fcfebf1882e039a3ed90e2af1ebf"},"schema_version":"1.0"},"canonical_sha256":"e35217721cd4eb04f6371aecd3fa321cf6644905d5fa79e9af50abf99584d579","source":{"kind":"arxiv","id":"1704.04866","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1704.04866","created_at":"2026-05-18T00:44:08Z"},{"alias_kind":"arxiv_version","alias_value":"1704.04866v3","created_at":"2026-05-18T00:44:08Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1704.04866","created_at":"2026-05-18T00:44:08Z"},{"alias_kind":"pith_short_12","alias_value":"4NJBO4Q42TVQ","created_at":"2026-05-18T12:31:00Z"},{"alias_kind":"pith_short_16","alias_value":"4NJBO4Q42TVQJ5RX","created_at":"2026-05-18T12:31:00Z"},{"alias_kind":"pith_short_8","alias_value":"4NJBO4Q4","created_at":"2026-05-18T12:31:00Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:4NJBO4Q42TVQJ5RXDLWNH6RSDT","target":"record","payload":{"canonical_record":{"source":{"id":"1704.04866","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-04-17T04:43:05Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"edc074be2dbb97340a7adaf9c71bfce1135642d44e8a8a669569220869bc14b1","abstract_canon_sha256":"3bd2b0a37feb2772cc8b307ea41a0ed67b80fcfebf1882e039a3ed90e2af1ebf"},"schema_version":"1.0"},"canonical_sha256":"e35217721cd4eb04f6371aecd3fa321cf6644905d5fa79e9af50abf99584d579","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:44:08.608580Z","signature_b64":"enYOYovk+l38Y2A0aX2bYTvyfBDaeaLDwbrjK6lnAp0hKYuxc5uHPLW7wGaQLPClZE/ZSgKPdbAFijRs370OBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e35217721cd4eb04f6371aecd3fa321cf6644905d5fa79e9af50abf99584d579","last_reissued_at":"2026-05-18T00:44:08.608086Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:44:08.608086Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1704.04866","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:44:08Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kBFNKNjq7PtJ9a7Ymsg4Pp5evnSoLeF7aROnC6oO4+FkugsEyyRDjtqU1TpEAc3O97qrQFbaNuCTZ1tX8tTcCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-26T07:08:54.800470Z"},"content_sha256":"fe18f5b106a0167b27dea5f2e1d89398b2acb3f4342177b67721b68b834d03e6","schema_version":"1.0","event_id":"sha256:fe18f5b106a0167b27dea5f2e1d89398b2acb3f4342177b67721b68b834d03e6"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:4NJBO4Q42TVQJ5RXDLWNH6RSDT","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Effective Warm Start for the Online Actor-Critic Reinforcement Learning based mHealth Intervention","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Feiyun Zhu, Peng Liao","submitted_at":"2017-04-17T04:43:05Z","abstract_excerpt":"Online reinforcement learning (RL) is increasingly popular for the personalized mobile health (mHealth) intervention. It is able to personalize the type and dose of interventions according to user's ongoing statuses and changing needs. However, at the beginning of online learning, there are usually too few samples to support the RL updating, which leads to poor performances. A delay in good performance of the online learning algorithms can be especially detrimental in the mHealth, where users tend to quickly disengage with the mHealth app. To address this problem, we propose a new online RL me"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1704.04866","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:44:08Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"wV8jJkuD+OqqxjLI1r+uL98uTU+NrzPpamEVhaAqhFpnIlc2jY8JbEA8T7g3vI4rWV8yvnbePr5GCuQT8aGoCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-26T07:08:54.800822Z"},"content_sha256":"aede41282a85d7e9940303bbfe4b89e573515fa309e1159a5b7a457d1fb30589","schema_version":"1.0","event_id":"sha256:aede41282a85d7e9940303bbfe4b89e573515fa309e1159a5b7a457d1fb30589"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/4NJBO4Q42TVQJ5RXDLWNH6RSDT/bundle.json","state_url":"https://pith.science/pith/4NJBO4Q42TVQJ5RXDLWNH6RSDT/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/4NJBO4Q42TVQJ5RXDLWNH6RSDT/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-26T07:08:54Z","links":{"resolver":"https://pith.science/pith/4NJBO4Q42TVQJ5RXDLWNH6RSDT","bundle":"https://pith.science/pith/4NJBO4Q42TVQJ5RXDLWNH6RSDT/bundle.json","state":"https://pith.science/pith/4NJBO4Q42TVQJ5RXDLWNH6RSDT/state.json","well_known_bundle":"https://pith.science/.well-known/pith/4NJBO4Q42TVQJ5RXDLWNH6RSDT/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:4NJBO4Q42TVQJ5RXDLWNH6RSDT","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"3bd2b0a37feb2772cc8b307ea41a0ed67b80fcfebf1882e039a3ed90e2af1ebf","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-04-17T04:43:05Z","title_canon_sha256":"edc074be2dbb97340a7adaf9c71bfce1135642d44e8a8a669569220869bc14b1"},"schema_version":"1.0","source":{"id":"1704.04866","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1704.04866","created_at":"2026-05-18T00:44:08Z"},{"alias_kind":"arxiv_version","alias_value":"1704.04866v3","created_at":"2026-05-18T00:44:08Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1704.04866","created_at":"2026-05-18T00:44:08Z"},{"alias_kind":"pith_short_12","alias_value":"4NJBO4Q42TVQ","created_at":"2026-05-18T12:31:00Z"},{"alias_kind":"pith_short_16","alias_value":"4NJBO4Q42TVQJ5RX","created_at":"2026-05-18T12:31:00Z"},{"alias_kind":"pith_short_8","alias_value":"4NJBO4Q4","created_at":"2026-05-18T12:31:00Z"}],"graph_snapshots":[{"event_id":"sha256:aede41282a85d7e9940303bbfe4b89e573515fa309e1159a5b7a457d1fb30589","target":"graph","created_at":"2026-05-18T00:44:08Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Online reinforcement learning (RL) is increasingly popular for the personalized mobile health (mHealth) intervention. It is able to personalize the type and dose of interventions according to user's ongoing statuses and changing needs. However, at the beginning of online learning, there are usually too few samples to support the RL updating, which leads to poor performances. A delay in good performance of the online learning algorithms can be especially detrimental in the mHealth, where users tend to quickly disengage with the mHealth app. To address this problem, we propose a new online RL me","authors_text":"Feiyun Zhu, Peng Liao","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-04-17T04:43:05Z","title":"Effective Warm Start for the Online Actor-Critic Reinforcement Learning based mHealth Intervention"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1704.04866","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:fe18f5b106a0167b27dea5f2e1d89398b2acb3f4342177b67721b68b834d03e6","target":"record","created_at":"2026-05-18T00:44:08Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"3bd2b0a37feb2772cc8b307ea41a0ed67b80fcfebf1882e039a3ed90e2af1ebf","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-04-17T04:43:05Z","title_canon_sha256":"edc074be2dbb97340a7adaf9c71bfce1135642d44e8a8a669569220869bc14b1"},"schema_version":"1.0","source":{"id":"1704.04866","kind":"arxiv","version":3}},"canonical_sha256":"e35217721cd4eb04f6371aecd3fa321cf6644905d5fa79e9af50abf99584d579","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e35217721cd4eb04f6371aecd3fa321cf6644905d5fa79e9af50abf99584d579","first_computed_at":"2026-05-18T00:44:08.608086Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:44:08.608086Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"enYOYovk+l38Y2A0aX2bYTvyfBDaeaLDwbrjK6lnAp0hKYuxc5uHPLW7wGaQLPClZE/ZSgKPdbAFijRs370OBA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:44:08.608580Z","signed_message":"canonical_sha256_bytes"},"source_id":"1704.04866","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:fe18f5b106a0167b27dea5f2e1d89398b2acb3f4342177b67721b68b834d03e6","sha256:aede41282a85d7e9940303bbfe4b89e573515fa309e1159a5b7a457d1fb30589"],"state_sha256":"edc8987c0d704e89c9e4f93a848b643b0d9dd604327ada2f170eec5abe16b41f"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"YODJIEug4rxaA1jAPhn8eejrUgrtHdC8a6D50TdF8UAuHTKj6GNMzNvU8lTBpICVr/KptFThXSKIfcCfK9sTDg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-26T07:08:54.802840Z","bundle_sha256":"a2f49cac9d50a48b8f5eadd423d21a57909877aba7a490b22def6685681dc9dd"}}