{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2020:JEWTWNYY3PC53D7ARHLPWFRKQ2","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"f1a781906e2cb8a8267fcc272750f5111091dbed44eb998d1ffb8a8790ee92e3","cross_cats_sorted":["math.ST","stat.ML","stat.TH"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2020-02-12T11:33:46Z","title_canon_sha256":"be08ebb86ed03b4e3e755d69474ba5a22aad80c036b3c85dfb1856481c91ea39"},"schema_version":"1.0","source":{"id":"2002.04926","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2002.04926","created_at":"2026-07-05T01:12:37Z"},{"alias_kind":"arxiv_version","alias_value":"2002.04926v2","created_at":"2026-07-05T01:12:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2002.04926","created_at":"2026-07-05T01:12:37Z"},{"alias_kind":"pith_short_12","alias_value":"JEWTWNYY3PC5","created_at":"2026-07-05T01:12:37Z"},{"alias_kind":"pith_short_16","alias_value":"JEWTWNYY3PC53D7A","created_at":"2026-07-05T01:12:37Z"},{"alias_kind":"pith_short_8","alias_value":"JEWTWNYY","created_at":"2026-07-05T01:12:37Z"}],"graph_snapshots":[{"event_id":"sha256:e7c8ddc26a197bc0a61554d359fc8a213c8c0a6236b6ccbefb2d235c5d35bc45","target":"graph","created_at":"2026-07-05T01:12:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2002.04926/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"A fundamental challenge in contextual bandits is to develop flexible, general-purpose algorithms with computational requirements no worse than classical supervised learning tasks such as classification and regression. Algorithms based on regression have shown promising empirical success, but theoretical guarantees have remained elusive except in special cases. We provide the first universal and optimal reduction from contextual bandits to online regression. We show how to transform any oracle for online regression with a given value function class into an algorithm for contextual bandits with ","authors_text":"Alexander Rakhlin, Dylan J. Foster","cross_cats":["math.ST","stat.ML","stat.TH"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2020-02-12T11:33:46Z","title":"Beyond UCB: Optimal and Efficient Contextual Bandits with Regression Oracles"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2002.04926","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:02886831ab8f28fba7275e1321ce69b3fd31d04cf9f8b43a3cbcd01fa7c27f72","target":"record","created_at":"2026-07-05T01:12:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"f1a781906e2cb8a8267fcc272750f5111091dbed44eb998d1ffb8a8790ee92e3","cross_cats_sorted":["math.ST","stat.ML","stat.TH"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2020-02-12T11:33:46Z","title_canon_sha256":"be08ebb86ed03b4e3e755d69474ba5a22aad80c036b3c85dfb1856481c91ea39"},"schema_version":"1.0","source":{"id":"2002.04926","kind":"arxiv","version":2}},"canonical_sha256":"492d3b3718dbc5dd8fe089d6fb162a86813b12feb8ffc5d8d44f25a9affacc4d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"492d3b3718dbc5dd8fe089d6fb162a86813b12feb8ffc5d8d44f25a9affacc4d","first_computed_at":"2026-07-05T01:12:37.388575Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T01:12:37.388575Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"7xEFXJQOFKIZiuVoWQQITaS4nl+6xkcHaKimQPNui0A45fPQmehxAj3s/f45qrfz8oleMuWd2dihPD4Wd7CfAA==","signature_status":"signed_v1","signed_at":"2026-07-05T01:12:37.389084Z","signed_message":"canonical_sha256_bytes"},"source_id":"2002.04926","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:02886831ab8f28fba7275e1321ce69b3fd31d04cf9f8b43a3cbcd01fa7c27f72","sha256:e7c8ddc26a197bc0a61554d359fc8a213c8c0a6236b6ccbefb2d235c5d35bc45"],"state_sha256":"80367d29693d4ac1c653f861bf9cc7200a3ade4e32b2fcfd83e1ed04b02048c9"}