{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:ALK7GNRDTDW7WNVODHIJKBFADA","short_pith_number":"pith:ALK7GNRD","canonical_record":{"source":{"id":"2606.18709","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-17T05:43:37Z","cross_cats_sorted":[],"title_canon_sha256":"b8b705b2858407e9b3be81a765ab5a56c9228b76ce1911aa2ba17c3f442137e4","abstract_canon_sha256":"e2d764dabf8a2eb76880299096a0199df8e9dcd36f2bc14f84c699cebff5ddfc"},"schema_version":"1.0"},"canonical_sha256":"02d5f3362398edfb36ae19d09504a01818a7505b53f94746f29c55eba737a643","source":{"kind":"arxiv","id":"2606.18709","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.18709","created_at":"2026-06-19T16:11:45Z"},{"alias_kind":"arxiv_version","alias_value":"2606.18709v1","created_at":"2026-06-19T16:11:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.18709","created_at":"2026-06-19T16:11:45Z"},{"alias_kind":"pith_short_12","alias_value":"ALK7GNRDTDW7","created_at":"2026-06-19T16:11:45Z"},{"alias_kind":"pith_short_16","alias_value":"ALK7GNRDTDW7WNVO","created_at":"2026-06-19T16:11:45Z"},{"alias_kind":"pith_short_8","alias_value":"ALK7GNRD","created_at":"2026-06-19T16:11:45Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:ALK7GNRDTDW7WNVODHIJKBFADA","target":"record","payload":{"canonical_record":{"source":{"id":"2606.18709","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-17T05:43:37Z","cross_cats_sorted":[],"title_canon_sha256":"b8b705b2858407e9b3be81a765ab5a56c9228b76ce1911aa2ba17c3f442137e4","abstract_canon_sha256":"e2d764dabf8a2eb76880299096a0199df8e9dcd36f2bc14f84c699cebff5ddfc"},"schema_version":"1.0"},"canonical_sha256":"02d5f3362398edfb36ae19d09504a01818a7505b53f94746f29c55eba737a643","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-19T16:11:45.251446Z","signature_b64":"0tttD/4fzYxo0vDAdFbogWXvUp6s9U9OlXb6JLX3qj5xnUFYQBjzicQHCTq7RtOqh3fsHEhFA5vN8yzjOFc+AQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"02d5f3362398edfb36ae19d09504a01818a7505b53f94746f29c55eba737a643","last_reissued_at":"2026-06-19T16:11:45.251004Z","signature_status":"signed_v1","first_computed_at":"2026-06-19T16:11:45.251004Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.18709","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-19T16:11:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"DLCoZL6EnzTI7v2Vz6G2lY3lwQT1sZh6niJ+pE9vWXEQJ+HSHDorBJP//XoYmfyM+kXFNouaY/bupd7xK12vDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-29T22:21:17.676536Z"},"content_sha256":"b83d7bc1d11c17999ffa437885974e26b522c2ee55932baa754a2fd16d5f7e10","schema_version":"1.0","event_id":"sha256:b83d7bc1d11c17999ffa437885974e26b522c2ee55932baa754a2fd16d5f7e10"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:ALK7GNRDTDW7WNVODHIJKBFADA","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"LLMs Struggle to Measure What Distinguishes Students of Different Proficiency Levels: A Study of Item Discrimination in Reading Comprehension Assessment","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Chenguang Wang, Dawei Zhou, Han Chen, Hong Jiao, Ming Li, Tianyi Zhou, Yijun Liang","submitted_at":"2026-06-17T05:43:37Z","abstract_excerpt":"Item discrimination is a fundamental psychometric property of educational assessment, which measures whether an item meaningfully distinguishes students with higher proficiency from students with lower proficiency. While various existing works have explored whether large language models (LLMs) can estimate item difficulty, it remains unclear whether they can capture item discrimination. In this work, we evaluate 42 proprietary and open-weight LLMs in zero-shot settings using two complementary approaches: direct discrimination prediction, where models explicitly estimate an item's discriminatio"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.18709","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.18709/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-19T16:11:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"8AswOdkNNNvmNX4F1fyB5NPxeB/CVMl7OfE+HJy1/+MXG2TlpToa9YfLfY4hX9+aQqX9HVnUbDBmcILN6NjuAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-29T22:21:17.676898Z"},"content_sha256":"dc6961e2d1a55c35c7abb04ce1012065b800da150e0160df473ad64d91913edf","schema_version":"1.0","event_id":"sha256:dc6961e2d1a55c35c7abb04ce1012065b800da150e0160df473ad64d91913edf"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ALK7GNRDTDW7WNVODHIJKBFADA/bundle.json","state_url":"https://pith.science/pith/ALK7GNRDTDW7WNVODHIJKBFADA/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ALK7GNRDTDW7WNVODHIJKBFADA/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-29T22:21:17Z","links":{"resolver":"https://pith.science/pith/ALK7GNRDTDW7WNVODHIJKBFADA","bundle":"https://pith.science/pith/ALK7GNRDTDW7WNVODHIJKBFADA/bundle.json","state":"https://pith.science/pith/ALK7GNRDTDW7WNVODHIJKBFADA/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ALK7GNRDTDW7WNVODHIJKBFADA/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:ALK7GNRDTDW7WNVODHIJKBFADA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e2d764dabf8a2eb76880299096a0199df8e9dcd36f2bc14f84c699cebff5ddfc","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-17T05:43:37Z","title_canon_sha256":"b8b705b2858407e9b3be81a765ab5a56c9228b76ce1911aa2ba17c3f442137e4"},"schema_version":"1.0","source":{"id":"2606.18709","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.18709","created_at":"2026-06-19T16:11:45Z"},{"alias_kind":"arxiv_version","alias_value":"2606.18709v1","created_at":"2026-06-19T16:11:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.18709","created_at":"2026-06-19T16:11:45Z"},{"alias_kind":"pith_short_12","alias_value":"ALK7GNRDTDW7","created_at":"2026-06-19T16:11:45Z"},{"alias_kind":"pith_short_16","alias_value":"ALK7GNRDTDW7WNVO","created_at":"2026-06-19T16:11:45Z"},{"alias_kind":"pith_short_8","alias_value":"ALK7GNRD","created_at":"2026-06-19T16:11:45Z"}],"graph_snapshots":[{"event_id":"sha256:dc6961e2d1a55c35c7abb04ce1012065b800da150e0160df473ad64d91913edf","target":"graph","created_at":"2026-06-19T16:11:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.18709/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Item discrimination is a fundamental psychometric property of educational assessment, which measures whether an item meaningfully distinguishes students with higher proficiency from students with lower proficiency. While various existing works have explored whether large language models (LLMs) can estimate item difficulty, it remains unclear whether they can capture item discrimination. In this work, we evaluate 42 proprietary and open-weight LLMs in zero-shot settings using two complementary approaches: direct discrimination prediction, where models explicitly estimate an item's discriminatio","authors_text":"Chenguang Wang, Dawei Zhou, Han Chen, Hong Jiao, Ming Li, Tianyi Zhou, Yijun Liang","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-17T05:43:37Z","title":"LLMs Struggle to Measure What Distinguishes Students of Different Proficiency Levels: A Study of Item Discrimination in Reading Comprehension Assessment"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.18709","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b83d7bc1d11c17999ffa437885974e26b522c2ee55932baa754a2fd16d5f7e10","target":"record","created_at":"2026-06-19T16:11:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e2d764dabf8a2eb76880299096a0199df8e9dcd36f2bc14f84c699cebff5ddfc","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-06-17T05:43:37Z","title_canon_sha256":"b8b705b2858407e9b3be81a765ab5a56c9228b76ce1911aa2ba17c3f442137e4"},"schema_version":"1.0","source":{"id":"2606.18709","kind":"arxiv","version":1}},"canonical_sha256":"02d5f3362398edfb36ae19d09504a01818a7505b53f94746f29c55eba737a643","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"02d5f3362398edfb36ae19d09504a01818a7505b53f94746f29c55eba737a643","first_computed_at":"2026-06-19T16:11:45.251004Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-19T16:11:45.251004Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"0tttD/4fzYxo0vDAdFbogWXvUp6s9U9OlXb6JLX3qj5xnUFYQBjzicQHCTq7RtOqh3fsHEhFA5vN8yzjOFc+AQ==","signature_status":"signed_v1","signed_at":"2026-06-19T16:11:45.251446Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.18709","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b83d7bc1d11c17999ffa437885974e26b522c2ee55932baa754a2fd16d5f7e10","sha256:dc6961e2d1a55c35c7abb04ce1012065b800da150e0160df473ad64d91913edf"],"state_sha256":"d7b2940fb8e516290111f4ac0f6f8fdbffb44947f197109dfd0a8884d08a4f17"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kU9qJjBmUxKLN7PssJ70n8B7N+h6a6IuKcwz7Nh6vYLzvFNNsQmMw0eW6fdmV/maZfQAMmnehW4rcx6yZlGiDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-29T22:21:17.678862Z","bundle_sha256":"b6397c7c79d293989103b00ad1b3d558a784a17bcc91a5d061ed3b0e0c61698a"}}