{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:GYWGFXQOQPQTLEMDDKL4WEQWAN","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"f288f1f6c2f0a28d53409b591d37a1889228523e63fa8bb5717ef8e4bde0e063","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-03-28T16:13:23Z","title_canon_sha256":"8a35298efa2fd56c7cf025031faf4d28936c0a98a2c55be7db941867e4bff9d2"},"schema_version":"1.0","source":{"id":"1703.09700","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1703.09700","created_at":"2026-05-18T00:12:35Z"},{"alias_kind":"arxiv_version","alias_value":"1703.09700v3","created_at":"2026-05-18T00:12:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1703.09700","created_at":"2026-05-18T00:12:35Z"},{"alias_kind":"pith_short_12","alias_value":"GYWGFXQOQPQT","created_at":"2026-05-18T12:31:18Z"},{"alias_kind":"pith_short_16","alias_value":"GYWGFXQOQPQTLEMD","created_at":"2026-05-18T12:31:18Z"},{"alias_kind":"pith_short_8","alias_value":"GYWGFXQO","created_at":"2026-05-18T12:31:18Z"}],"graph_snapshots":[{"event_id":"sha256:bd26205bdddfd8dd01075e49bb9164c20b6bc552465ba361294396dc50db867e","target":"graph","created_at":"2026-05-18T00:12:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Inverse reinforcement learning (IRL) aims to explain observed strategic behavior by fitting reinforcement learning models to behavioral data. However, traditional IRL methods are only applicable when the observations are in the form of state-action paths. This assumption may not hold in many real-world modeling settings, where only partial or summarized observations are available. In general, we may assume that there is a summarizing function $\\sigma$, which acts as a filter between us and the true state-action paths that constitute the demonstration. Some initial approaches to extending IRL t","authors_text":"Antti Kangasr\\\"a\\\"asi\\\"o, Samuel Kaski","cross_cats":["cs.AI","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-03-28T16:13:23Z","title":"Inverse Reinforcement Learning from Summary Data"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1703.09700","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:39e61d1c9fb3acbf29d6fcca67f96a773bacd02a9c30fd25e249c8e59902a36a","target":"record","created_at":"2026-05-18T00:12:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"f288f1f6c2f0a28d53409b591d37a1889228523e63fa8bb5717ef8e4bde0e063","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-03-28T16:13:23Z","title_canon_sha256":"8a35298efa2fd56c7cf025031faf4d28936c0a98a2c55be7db941867e4bff9d2"},"schema_version":"1.0","source":{"id":"1703.09700","kind":"arxiv","version":3}},"canonical_sha256":"362c62de0e83e13591831a97cb1216036b62ec234542a4daea3f057439cae0c9","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"362c62de0e83e13591831a97cb1216036b62ec234542a4daea3f057439cae0c9","first_computed_at":"2026-05-18T00:12:35.490429Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:12:35.490429Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"rODPBmEji+ibHilrtpVcIw3gaR1lRF/TRPNG4gKkQB4t7wo6AIa08kPj4QG3fe0toW5lGQ3Dqj4q4TGyZhM5Bg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:12:35.490993Z","signed_message":"canonical_sha256_bytes"},"source_id":"1703.09700","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:39e61d1c9fb3acbf29d6fcca67f96a773bacd02a9c30fd25e249c8e59902a36a","sha256:bd26205bdddfd8dd01075e49bb9164c20b6bc552465ba361294396dc50db867e"],"state_sha256":"8a64a9e8d3ce6c1d7495d6399d868030fb1eb8f6f3d3609ca520207ae4a5d96a"}