{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:UA6AYC3AYU4J6UXNRIPZD25W3W","short_pith_number":"pith:UA6AYC3A","canonical_record":{"source":{"id":"1801.09319","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"physics.comp-ph","submitted_at":"2018-01-28T23:48:01Z","cross_cats_sorted":["cs.LG","physics.chem-ph","stat.ML"],"title_canon_sha256":"623a7b3b04fda03a2de273a64a01a1bbbb8ac9593bea1e6e6da75bcdb43d79e5","abstract_canon_sha256":"6f51663a6ef203e272dd7c90b89a4ac06064c1ab9063f605338244b46af355f8"},"schema_version":"1.0"},"canonical_sha256":"a03c0c0b60c5389f52ed8a1f91ebb6dda079515b69ca2bdb5d5bba3843a61e6c","source":{"kind":"arxiv","id":"1801.09319","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1801.09319","created_at":"2026-05-18T00:15:05Z"},{"alias_kind":"arxiv_version","alias_value":"1801.09319v2","created_at":"2026-05-18T00:15:05Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1801.09319","created_at":"2026-05-18T00:15:05Z"},{"alias_kind":"pith_short_12","alias_value":"UA6AYC3AYU4J","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_16","alias_value":"UA6AYC3AYU4J6UXN","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_8","alias_value":"UA6AYC3A","created_at":"2026-05-18T12:32:56Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:UA6AYC3AYU4J6UXNRIPZD25W3W","target":"record","payload":{"canonical_record":{"source":{"id":"1801.09319","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"physics.comp-ph","submitted_at":"2018-01-28T23:48:01Z","cross_cats_sorted":["cs.LG","physics.chem-ph","stat.ML"],"title_canon_sha256":"623a7b3b04fda03a2de273a64a01a1bbbb8ac9593bea1e6e6da75bcdb43d79e5","abstract_canon_sha256":"6f51663a6ef203e272dd7c90b89a4ac06064c1ab9063f605338244b46af355f8"},"schema_version":"1.0"},"canonical_sha256":"a03c0c0b60c5389f52ed8a1f91ebb6dda079515b69ca2bdb5d5bba3843a61e6c","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:15:05.011554Z","signature_b64":"gElwumkl6kaelTYkOBdtxy7gxvQl789yp/UhJ5Qa2Y6y46HiKGkW4TQazIpJmtwNUEOmRHMBpyMqmnbjRySHDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a03c0c0b60c5389f52ed8a1f91ebb6dda079515b69ca2bdb5d5bba3843a61e6c","last_reissued_at":"2026-05-18T00:15:05.011000Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:15:05.011000Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1801.09319","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:15:05Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hPgIk+XENxSfbIg5euFzhpLAvmfsWmpMrXsO8iH9cQfY+dQuqMoA6BEGFysVvaBG78Xs6ue1r6rvTTSjE6A9BQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-25T12:23:11.166453Z"},"content_sha256":"540444c7f650c03b399b6fd74882720cb4f0c2a79e868d5a0a701ce6b6e7120e","schema_version":"1.0","event_id":"sha256:540444c7f650c03b399b6fd74882720cb4f0c2a79e868d5a0a701ce6b6e7120e"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:UA6AYC3AYU4J6UXNRIPZD25W3W","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Less is more: sampling chemical space with active learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","physics.chem-ph","stat.ML"],"primary_cat":"physics.comp-ph","authors_text":"Adrian E. Roitberg, Ben Nebgen, Justin S. Smith, Nicholas Lubbers, Olexandr Isayev","submitted_at":"2018-01-28T23:48:01Z","abstract_excerpt":"The development of accurate and transferable machine learning (ML) potentials for predicting molecular energetics is a challenging task. The process of data generation to train such ML potentials is a task neither well understood nor researched in detail. In this work, we present a fully automated approach for the generation of datasets with the intent of training universal ML potentials. It is based on the concept of active learning (AL) via Query by Committee (QBC), which uses the disagreement between an ensemble of ML potentials to infer the reliability of the ensemble's prediction. QBC all"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1801.09319","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:15:05Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"L6anR1+iKnERzZ84PpNSgu3BexLW6BrYgcWPA5244bHUVRtCN6e3RQEcCA5DgR6Dhna6MujHyCxqEB/O9x55Cg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-25T12:23:11.166799Z"},"content_sha256":"138733691bfcbafb64c2f0fb77497ea64851f62663333bbbb44398431ac8e24a","schema_version":"1.0","event_id":"sha256:138733691bfcbafb64c2f0fb77497ea64851f62663333bbbb44398431ac8e24a"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/UA6AYC3AYU4J6UXNRIPZD25W3W/bundle.json","state_url":"https://pith.science/pith/UA6AYC3AYU4J6UXNRIPZD25W3W/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/UA6AYC3AYU4J6UXNRIPZD25W3W/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-25T12:23:11Z","links":{"resolver":"https://pith.science/pith/UA6AYC3AYU4J6UXNRIPZD25W3W","bundle":"https://pith.science/pith/UA6AYC3AYU4J6UXNRIPZD25W3W/bundle.json","state":"https://pith.science/pith/UA6AYC3AYU4J6UXNRIPZD25W3W/state.json","well_known_bundle":"https://pith.science/.well-known/pith/UA6AYC3AYU4J6UXNRIPZD25W3W/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:UA6AYC3AYU4J6UXNRIPZD25W3W","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"6f51663a6ef203e272dd7c90b89a4ac06064c1ab9063f605338244b46af355f8","cross_cats_sorted":["cs.LG","physics.chem-ph","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"physics.comp-ph","submitted_at":"2018-01-28T23:48:01Z","title_canon_sha256":"623a7b3b04fda03a2de273a64a01a1bbbb8ac9593bea1e6e6da75bcdb43d79e5"},"schema_version":"1.0","source":{"id":"1801.09319","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1801.09319","created_at":"2026-05-18T00:15:05Z"},{"alias_kind":"arxiv_version","alias_value":"1801.09319v2","created_at":"2026-05-18T00:15:05Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1801.09319","created_at":"2026-05-18T00:15:05Z"},{"alias_kind":"pith_short_12","alias_value":"UA6AYC3AYU4J","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_16","alias_value":"UA6AYC3AYU4J6UXN","created_at":"2026-05-18T12:32:56Z"},{"alias_kind":"pith_short_8","alias_value":"UA6AYC3A","created_at":"2026-05-18T12:32:56Z"}],"graph_snapshots":[{"event_id":"sha256:138733691bfcbafb64c2f0fb77497ea64851f62663333bbbb44398431ac8e24a","target":"graph","created_at":"2026-05-18T00:15:05Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The development of accurate and transferable machine learning (ML) potentials for predicting molecular energetics is a challenging task. The process of data generation to train such ML potentials is a task neither well understood nor researched in detail. In this work, we present a fully automated approach for the generation of datasets with the intent of training universal ML potentials. It is based on the concept of active learning (AL) via Query by Committee (QBC), which uses the disagreement between an ensemble of ML potentials to infer the reliability of the ensemble's prediction. QBC all","authors_text":"Adrian E. Roitberg, Ben Nebgen, Justin S. Smith, Nicholas Lubbers, Olexandr Isayev","cross_cats":["cs.LG","physics.chem-ph","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"physics.comp-ph","submitted_at":"2018-01-28T23:48:01Z","title":"Less is more: sampling chemical space with active learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1801.09319","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:540444c7f650c03b399b6fd74882720cb4f0c2a79e868d5a0a701ce6b6e7120e","target":"record","created_at":"2026-05-18T00:15:05Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"6f51663a6ef203e272dd7c90b89a4ac06064c1ab9063f605338244b46af355f8","cross_cats_sorted":["cs.LG","physics.chem-ph","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"physics.comp-ph","submitted_at":"2018-01-28T23:48:01Z","title_canon_sha256":"623a7b3b04fda03a2de273a64a01a1bbbb8ac9593bea1e6e6da75bcdb43d79e5"},"schema_version":"1.0","source":{"id":"1801.09319","kind":"arxiv","version":2}},"canonical_sha256":"a03c0c0b60c5389f52ed8a1f91ebb6dda079515b69ca2bdb5d5bba3843a61e6c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a03c0c0b60c5389f52ed8a1f91ebb6dda079515b69ca2bdb5d5bba3843a61e6c","first_computed_at":"2026-05-18T00:15:05.011000Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:15:05.011000Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"gElwumkl6kaelTYkOBdtxy7gxvQl789yp/UhJ5Qa2Y6y46HiKGkW4TQazIpJmtwNUEOmRHMBpyMqmnbjRySHDQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:15:05.011554Z","signed_message":"canonical_sha256_bytes"},"source_id":"1801.09319","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:540444c7f650c03b399b6fd74882720cb4f0c2a79e868d5a0a701ce6b6e7120e","sha256:138733691bfcbafb64c2f0fb77497ea64851f62663333bbbb44398431ac8e24a"],"state_sha256":"3e404f0fe3d0dbe33c9e288d60dc00035a2d4b7c1b0b3e825817514065b77835"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+rQLzhQxpgZwbRMBtBfxt6/qmA0GojQVoYhNQq+Lix7nIde7PoPpQMdzodB1FY5soiI8FXNtBWGF79us9a7PBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-25T12:23:11.168691Z","bundle_sha256":"39fab8b34a3fed94de5dd87cb482a5765c5651e5a8ccb8cc1ad2ad01f85f4e78"}}