{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:6SPVHHTQFFH3VT4O4UQE5EXE2R","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"fe3d9d3fe7e454fbcdd90f959430fb7b28af5589c52188d5fff462924b05a306","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-04-29T13:11:53Z","title_canon_sha256":"4779010de5f5dcb70c756079349442abf1cbd61f5cd79f31658b265b046a3df2"},"schema_version":"1.0","source":{"id":"2604.26645","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2604.26645","created_at":"2026-05-29T02:05:45Z"},{"alias_kind":"arxiv_version","alias_value":"2604.26645v2","created_at":"2026-05-29T02:05:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2604.26645","created_at":"2026-05-29T02:05:45Z"},{"alias_kind":"pith_short_12","alias_value":"6SPVHHTQFFH3","created_at":"2026-05-29T02:05:45Z"},{"alias_kind":"pith_short_16","alias_value":"6SPVHHTQFFH3VT4O","created_at":"2026-05-29T02:05:45Z"},{"alias_kind":"pith_short_8","alias_value":"6SPVHHTQ","created_at":"2026-05-29T02:05:45Z"}],"graph_snapshots":[{"event_id":"sha256:b53a835a83b9f4fa65e700287f0094c5610f422f0dffda03be0be60866ff7161","target":"graph","created_at":"2026-05-29T02:05:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"We propose SciHorizon-DataEVA, a novel agentic system to scalable AI-readiness evaluation of heterogeneous scientific data... Extensive experiments on scientific datasets spanning multiple domains demonstrate the effectiveness and generality of SciHorizon-DataEVA for principled AI-readiness evaluation."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"That the Sci-TQA2 principles can be decomposed into measurable atomic elements and that the hierarchical multi-agent workflow with dynamic specification construction and self-correction will produce reliable, generalizable assessments across heterogeneous data without domain-specific failures or high error rates."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"SciHorizon-DataEVA is a hierarchical multi-agent system that applies Sci-TQA2 principles to assess AI-readiness of heterogeneous scientific data through dynamic evaluation specifications and adaptive tool use."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"SciHorizon-DataEVA is an agentic system that enables scalable AI-readiness evaluation of heterogeneous scientific data by defining Sci-TQA2 principles and executing them through a hierarchical multi-agent workflow."}],"snapshot_sha256":"0bbb0b0064b0cb2e8e905d4f1bef88f51e1ebebd6a3d831ebb0c5d8aeb49b4b0"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"ai_meta_artifact","ran_at":"2026-05-20T23:45:34.345115Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"doi_compliance","ran_at":"2026-05-19T19:57:53.698058Z","status":"completed","version":"1.0.0"}],"endpoint":"/pith/2604.26645/integrity.json","findings":[],"snapshot_sha256":"00d8df9ae65e7a8617fe3b479a78fe5bf89d320875f115a102645cbaa8459d19","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"AI-for-Science (AI4Science) is increasingly transforming scientific discovery by embedding machine learning models into prediction, simulation, and hypothesis generation workflows across domains. However, the effectiveness of these models is fundamentally constrained by the AI-readiness of scientific data, for which no scalable and systematic evaluation mechanism currently exists. In this work, we propose SciHorizon-DataEVA, a novel agentic system to scalable AI-readiness evaluation of heterogeneous scientific data. At the evaluation-criteria level, we introduce the Sci-TQA2 principles, which ","authors_text":"Chuan Qin, Dianyu Liu, Hengshu Zhu, Wenxi Xu, Xiaohan Li, Xi Chen, Xin Chen, Yuanchun Zhou, Yuyang Wang","cross_cats":["cs.LG"],"headline":"SciHorizon-DataEVA is an agentic system that enables scalable AI-readiness evaluation of heterogeneous scientific data by defining Sci-TQA2 principles and executing them through a hierarchical multi-agent workflow.","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-04-29T13:11:53Z","title":"SciHorizon-DataEVA: An Agentic System for AI-Readiness Evaluation of Heterogeneous Scientific Data"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2604.26645","kind":"arxiv","version":2},"verdict":{"created_at":"2026-05-07T10:48:34.031123Z","id":"c6534f1c-fcac-47b7-9036-7d060cb1624c","model_set":{"reader":"grok-4.3"},"one_line_summary":"SciHorizon-DataEVA is a hierarchical multi-agent system that applies Sci-TQA2 principles to assess AI-readiness of heterogeneous scientific data through dynamic evaluation specifications and adaptive tool use.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"SciHorizon-DataEVA is an agentic system that enables scalable AI-readiness evaluation of heterogeneous scientific data by defining Sci-TQA2 principles and executing them through a hierarchical multi-agent workflow.","strongest_claim":"We propose SciHorizon-DataEVA, a novel agentic system to scalable AI-readiness evaluation of heterogeneous scientific data... Extensive experiments on scientific datasets spanning multiple domains demonstrate the effectiveness and generality of SciHorizon-DataEVA for principled AI-readiness evaluation.","weakest_assumption":"That the Sci-TQA2 principles can be decomposed into measurable atomic elements and that the hierarchical multi-agent workflow with dynamic specification construction and self-correction will produce reliable, generalizable assessments across heterogeneous data without domain-specific failures or high error rates."}},"verdict_id":"c6534f1c-fcac-47b7-9036-7d060cb1624c"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:89a29beefde31852438e8bb1f0a59a466204638b1969055b44382d1c94aef829","target":"record","created_at":"2026-05-29T02:05:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"fe3d9d3fe7e454fbcdd90f959430fb7b28af5589c52188d5fff462924b05a306","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-04-29T13:11:53Z","title_canon_sha256":"4779010de5f5dcb70c756079349442abf1cbd61f5cd79f31658b265b046a3df2"},"schema_version":"1.0","source":{"id":"2604.26645","kind":"arxiv","version":2}},"canonical_sha256":"f49f539e70294fbacf8ee5204e92e4d45b643614da0e238c077890b8b1f33d20","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f49f539e70294fbacf8ee5204e92e4d45b643614da0e238c077890b8b1f33d20","first_computed_at":"2026-05-29T02:05:45.346514Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-29T02:05:45.346514Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"KcLpVp1sn8zh4ubLo0BkuuD093DgXgm3PrtxhgI0QNgx/C2ewK0slYlYJBDSJkTAJi1qceHhS/4APsP3k5L2Bg==","signature_status":"signed_v1","signed_at":"2026-05-29T02:05:45.347350Z","signed_message":"canonical_sha256_bytes"},"source_id":"2604.26645","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:89a29beefde31852438e8bb1f0a59a466204638b1969055b44382d1c94aef829","sha256:b53a835a83b9f4fa65e700287f0094c5610f422f0dffda03be0be60866ff7161"],"state_sha256":"9bf1cfb833cc2cbb9555faac134b68f6e78b2867c978580b396602dccd67d41e"}