{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:4ZM6J2T7ED44VNGIBRDU3MRL7R","short_pith_number":"pith:4ZM6J2T7","canonical_record":{"source":{"id":"2606.16000","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-14T19:58:06Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"437aacbd9b2fb9607241b66717fa6a69c64a657a7fddf4cf4e251e1d3939198e","abstract_canon_sha256":"ead18b7c4e88ac5f26ca88a0f30ce43542fa8726f5970d82c8a205f89562028e"},"schema_version":"1.0"},"canonical_sha256":"e659e4ea7f20f9cab4c80c474db22bfc621c4c6c2cf927a9ae7e53fe7b29aeab","source":{"kind":"arxiv","id":"2606.16000","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.16000","created_at":"2026-06-19T16:10:56Z"},{"alias_kind":"arxiv_version","alias_value":"2606.16000v2","created_at":"2026-06-19T16:10:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.16000","created_at":"2026-06-19T16:10:56Z"},{"alias_kind":"pith_short_12","alias_value":"4ZM6J2T7ED44","created_at":"2026-06-19T16:10:56Z"},{"alias_kind":"pith_short_16","alias_value":"4ZM6J2T7ED44VNGI","created_at":"2026-06-19T16:10:56Z"},{"alias_kind":"pith_short_8","alias_value":"4ZM6J2T7","created_at":"2026-06-19T16:10:56Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:4ZM6J2T7ED44VNGIBRDU3MRL7R","target":"record","payload":{"canonical_record":{"source":{"id":"2606.16000","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-14T19:58:06Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"437aacbd9b2fb9607241b66717fa6a69c64a657a7fddf4cf4e251e1d3939198e","abstract_canon_sha256":"ead18b7c4e88ac5f26ca88a0f30ce43542fa8726f5970d82c8a205f89562028e"},"schema_version":"1.0"},"canonical_sha256":"e659e4ea7f20f9cab4c80c474db22bfc621c4c6c2cf927a9ae7e53fe7b29aeab","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-19T16:10:56.114128Z","signature_b64":"n2Gf5J0H57xK+GvIJjlmi+UnnADW4XXrXefRC6/epjzmZqFnM3W99A42MNFbvmmmHil7yHDP6YGEbEHhECeXBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e659e4ea7f20f9cab4c80c474db22bfc621c4c6c2cf927a9ae7e53fe7b29aeab","last_reissued_at":"2026-06-19T16:10:56.113658Z","signature_status":"signed_v1","first_computed_at":"2026-06-19T16:10:56.113658Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.16000","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-19T16:10:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6cB7iogRxE7eFA3iALUjteEDUQwGYQpDSMb36wUDnPFgz6EcloeMj4l+XuVkLgw8igkIBHmNUr1aZpy/k1xoBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T13:37:53.535697Z"},"content_sha256":"1fc5986b3b7df94794b187b51ebcd24158500a23ad125adffe24c6e96a298d53","schema_version":"1.0","event_id":"sha256:1fc5986b3b7df94794b187b51ebcd24158500a23ad125adffe24c6e96a298d53"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:4ZM6J2T7ED44VNGIBRDU3MRL7R","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"GRACE-DS: a Guarded Reward-guided Agent Correction Environment in Data Science","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.CL","authors_text":"Aleksandr Tsymbalov, Anastasiya Palienko, Artem Epifanov, Danis Zaripov","submitted_at":"2026-06-14T19:58:06Z","abstract_excerpt":"We introduce GRACE-DS, a Guarded Reward-guided Agent Correction Environment in Data Science for pre-deployment evaluation of LLM-powered AutoML agents. GRACE-DS is a set of evaluation metrics in an isolated environment that can be applied to tabular ML tasks specific to a particular organization. It exposes agents to realistic workflow stages, from planning and data inspection through feature engineering, model development, validation, and code repair to final submission, while hidden executable validators measure not only final predictive performance but also leakage avoidance, reproducibilit"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.16000","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.16000/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-19T16:10:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jjdmkd56XbGY4b5PiekDF3M11P8IttPx/ZUjv4PaV2PMV/AcSn74D/AqcLksQ5zbzP1P0swNf0g13dNDNxO9BQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T13:37:53.536100Z"},"content_sha256":"dc00aa725f94d40adebeb9f24dc0d04aad4eea4ffddd43c74359731f3d472a0c","schema_version":"1.0","event_id":"sha256:dc00aa725f94d40adebeb9f24dc0d04aad4eea4ffddd43c74359731f3d472a0c"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/4ZM6J2T7ED44VNGIBRDU3MRL7R/bundle.json","state_url":"https://pith.science/pith/4ZM6J2T7ED44VNGIBRDU3MRL7R/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/4ZM6J2T7ED44VNGIBRDU3MRL7R/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-04T13:37:53Z","links":{"resolver":"https://pith.science/pith/4ZM6J2T7ED44VNGIBRDU3MRL7R","bundle":"https://pith.science/pith/4ZM6J2T7ED44VNGIBRDU3MRL7R/bundle.json","state":"https://pith.science/pith/4ZM6J2T7ED44VNGIBRDU3MRL7R/state.json","well_known_bundle":"https://pith.science/.well-known/pith/4ZM6J2T7ED44VNGIBRDU3MRL7R/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:4ZM6J2T7ED44VNGIBRDU3MRL7R","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ead18b7c4e88ac5f26ca88a0f30ce43542fa8726f5970d82c8a205f89562028e","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-14T19:58:06Z","title_canon_sha256":"437aacbd9b2fb9607241b66717fa6a69c64a657a7fddf4cf4e251e1d3939198e"},"schema_version":"1.0","source":{"id":"2606.16000","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.16000","created_at":"2026-06-19T16:10:56Z"},{"alias_kind":"arxiv_version","alias_value":"2606.16000v2","created_at":"2026-06-19T16:10:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.16000","created_at":"2026-06-19T16:10:56Z"},{"alias_kind":"pith_short_12","alias_value":"4ZM6J2T7ED44","created_at":"2026-06-19T16:10:56Z"},{"alias_kind":"pith_short_16","alias_value":"4ZM6J2T7ED44VNGI","created_at":"2026-06-19T16:10:56Z"},{"alias_kind":"pith_short_8","alias_value":"4ZM6J2T7","created_at":"2026-06-19T16:10:56Z"}],"graph_snapshots":[{"event_id":"sha256:dc00aa725f94d40adebeb9f24dc0d04aad4eea4ffddd43c74359731f3d472a0c","target":"graph","created_at":"2026-06-19T16:10:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.16000/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"We introduce GRACE-DS, a Guarded Reward-guided Agent Correction Environment in Data Science for pre-deployment evaluation of LLM-powered AutoML agents. GRACE-DS is a set of evaluation metrics in an isolated environment that can be applied to tabular ML tasks specific to a particular organization. It exposes agents to realistic workflow stages, from planning and data inspection through feature engineering, model development, validation, and code repair to final submission, while hidden executable validators measure not only final predictive performance but also leakage avoidance, reproducibilit","authors_text":"Aleksandr Tsymbalov, Anastasiya Palienko, Artem Epifanov, Danis Zaripov","cross_cats":["cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-14T19:58:06Z","title":"GRACE-DS: a Guarded Reward-guided Agent Correction Environment in Data Science"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.16000","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:1fc5986b3b7df94794b187b51ebcd24158500a23ad125adffe24c6e96a298d53","target":"record","created_at":"2026-06-19T16:10:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ead18b7c4e88ac5f26ca88a0f30ce43542fa8726f5970d82c8a205f89562028e","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-14T19:58:06Z","title_canon_sha256":"437aacbd9b2fb9607241b66717fa6a69c64a657a7fddf4cf4e251e1d3939198e"},"schema_version":"1.0","source":{"id":"2606.16000","kind":"arxiv","version":2}},"canonical_sha256":"e659e4ea7f20f9cab4c80c474db22bfc621c4c6c2cf927a9ae7e53fe7b29aeab","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e659e4ea7f20f9cab4c80c474db22bfc621c4c6c2cf927a9ae7e53fe7b29aeab","first_computed_at":"2026-06-19T16:10:56.113658Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-19T16:10:56.113658Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"n2Gf5J0H57xK+GvIJjlmi+UnnADW4XXrXefRC6/epjzmZqFnM3W99A42MNFbvmmmHil7yHDP6YGEbEHhECeXBA==","signature_status":"signed_v1","signed_at":"2026-06-19T16:10:56.114128Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.16000","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:1fc5986b3b7df94794b187b51ebcd24158500a23ad125adffe24c6e96a298d53","sha256:dc00aa725f94d40adebeb9f24dc0d04aad4eea4ffddd43c74359731f3d472a0c"],"state_sha256":"bc11a0b83ca291ed3fa8ded7ad78d388fb277361c88c13a17d9537e9994eda2f"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FyJsJDYRgf/ThxaSoS9C5VL/DmD3NEk5XLkINnlWahOR+A6PMgSr6Jygd3OmwikYfiyfJY5/OMqP2zrHj/UMBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-04T13:37:53.538130Z","bundle_sha256":"3a03b6d21d8199b01c1a607e0db58b004bfa83459d3e42516fd97de46d00a5e7"}}