{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:3KCLQBMYJ6AMFGY4J2GJ676ZJD","short_pith_number":"pith:3KCLQBMY","canonical_record":{"source":{"id":"2606.07929","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-06-06T01:39:14Z","cross_cats_sorted":[],"title_canon_sha256":"fb6b477441842e01ee1cdc191abfa7f1073329757ae20414c0fdfc2c992a5144","abstract_canon_sha256":"c80d69c98e980fe13798e6a04120911c4f97802557b6b7780b26295608c57de2"},"schema_version":"1.0"},"canonical_sha256":"da84b805984f80c29b1c4e8c9f7fd948fee2f905392e586c9d29c1d5903bcfb4","source":{"kind":"arxiv","id":"2606.07929","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.07929","created_at":"2026-06-09T01:04:55Z"},{"alias_kind":"arxiv_version","alias_value":"2606.07929v1","created_at":"2026-06-09T01:04:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.07929","created_at":"2026-06-09T01:04:55Z"},{"alias_kind":"pith_short_12","alias_value":"3KCLQBMYJ6AM","created_at":"2026-06-09T01:04:55Z"},{"alias_kind":"pith_short_16","alias_value":"3KCLQBMYJ6AMFGY4","created_at":"2026-06-09T01:04:55Z"},{"alias_kind":"pith_short_8","alias_value":"3KCLQBMY","created_at":"2026-06-09T01:04:55Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:3KCLQBMYJ6AMFGY4J2GJ676ZJD","target":"record","payload":{"canonical_record":{"source":{"id":"2606.07929","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-06-06T01:39:14Z","cross_cats_sorted":[],"title_canon_sha256":"fb6b477441842e01ee1cdc191abfa7f1073329757ae20414c0fdfc2c992a5144","abstract_canon_sha256":"c80d69c98e980fe13798e6a04120911c4f97802557b6b7780b26295608c57de2"},"schema_version":"1.0"},"canonical_sha256":"da84b805984f80c29b1c4e8c9f7fd948fee2f905392e586c9d29c1d5903bcfb4","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-09T01:04:55.697137Z","signature_b64":"S5i5gbBfDQ0lbItqIg60jhF1geRtJzqLcU89BYePMuB7EHPbQ7ExSByVNSbol0q0CPj+C1ddz2nATQMf59rNCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"da84b805984f80c29b1c4e8c9f7fd948fee2f905392e586c9d29c1d5903bcfb4","last_reissued_at":"2026-06-09T01:04:55.696739Z","signature_status":"signed_v1","first_computed_at":"2026-06-09T01:04:55.696739Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.07929","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-09T01:04:55Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"X3ninTjeJxIzt14DEcGiK4A/L2B/0Rp7CCCrRmY+BfF2yl/4+3RkHCXFn4hlzVl28VaFZA4z3kKolUX93z9GBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T15:26:21.599213Z"},"content_sha256":"b577a7c093b91b83e8df5b3c9dc09e7cdda5f2b42a34625b61c1d76966042b23","schema_version":"1.0","event_id":"sha256:b577a7c093b91b83e8df5b3c9dc09e7cdda5f2b42a34625b61c1d76966042b23"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:3KCLQBMYJ6AMFGY4J2GJ676ZJD","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Stress-testing medical large language models reveals latent safety pathology beyond benchmark accuracy","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Linghua Yu, Xiaojun Wu, Yuan Shen","submitted_at":"2026-06-06T01:39:14Z","abstract_excerpt":"Large language models (LLMs) are entering clinical practice based on benchmark accuracy that may fail to detect safety-relevant failure modes. Here we present AI-MASLD, a stress-audit framework that adapts the logic of metabolic stress testing from hepatology to the evaluation of clinical LLMs. Using 240 clinical cases across six narrative perturbation probes, we subjected seven models to double-stress testing and quantified performance through three indices: metabolic index (MI), perturbation flip rate (PFR), and counterfactual fairness index (CFI). Under clean baseline conditions, all models"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.07929","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.07929/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-09T01:04:55Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"pthKdjO0p/KOxEl6L5akicO1ln1qt79s4lI1dZAJHmx7zkU4jOVOzTi3xzfwVH/FXREd5hTHIUmsWWgH92XxBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T15:26:21.599600Z"},"content_sha256":"afc6f96c32766f640c80c9c11b0e97709d41ffb1c03ae891cb758f3b31f3893a","schema_version":"1.0","event_id":"sha256:afc6f96c32766f640c80c9c11b0e97709d41ffb1c03ae891cb758f3b31f3893a"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/3KCLQBMYJ6AMFGY4J2GJ676ZJD/bundle.json","state_url":"https://pith.science/pith/3KCLQBMYJ6AMFGY4J2GJ676ZJD/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/3KCLQBMYJ6AMFGY4J2GJ676ZJD/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-04T15:26:21Z","links":{"resolver":"https://pith.science/pith/3KCLQBMYJ6AMFGY4J2GJ676ZJD","bundle":"https://pith.science/pith/3KCLQBMYJ6AMFGY4J2GJ676ZJD/bundle.json","state":"https://pith.science/pith/3KCLQBMYJ6AMFGY4J2GJ676ZJD/state.json","well_known_bundle":"https://pith.science/.well-known/pith/3KCLQBMYJ6AMFGY4J2GJ676ZJD/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:3KCLQBMYJ6AMFGY4J2GJ676ZJD","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"c80d69c98e980fe13798e6a04120911c4f97802557b6b7780b26295608c57de2","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-06-06T01:39:14Z","title_canon_sha256":"fb6b477441842e01ee1cdc191abfa7f1073329757ae20414c0fdfc2c992a5144"},"schema_version":"1.0","source":{"id":"2606.07929","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.07929","created_at":"2026-06-09T01:04:55Z"},{"alias_kind":"arxiv_version","alias_value":"2606.07929v1","created_at":"2026-06-09T01:04:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.07929","created_at":"2026-06-09T01:04:55Z"},{"alias_kind":"pith_short_12","alias_value":"3KCLQBMYJ6AM","created_at":"2026-06-09T01:04:55Z"},{"alias_kind":"pith_short_16","alias_value":"3KCLQBMYJ6AMFGY4","created_at":"2026-06-09T01:04:55Z"},{"alias_kind":"pith_short_8","alias_value":"3KCLQBMY","created_at":"2026-06-09T01:04:55Z"}],"graph_snapshots":[{"event_id":"sha256:afc6f96c32766f640c80c9c11b0e97709d41ffb1c03ae891cb758f3b31f3893a","target":"graph","created_at":"2026-06-09T01:04:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.07929/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Large language models (LLMs) are entering clinical practice based on benchmark accuracy that may fail to detect safety-relevant failure modes. Here we present AI-MASLD, a stress-audit framework that adapts the logic of metabolic stress testing from hepatology to the evaluation of clinical LLMs. Using 240 clinical cases across six narrative perturbation probes, we subjected seven models to double-stress testing and quantified performance through three indices: metabolic index (MI), perturbation flip rate (PFR), and counterfactual fairness index (CFI). Under clean baseline conditions, all models","authors_text":"Linghua Yu, Xiaojun Wu, Yuan Shen","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-06-06T01:39:14Z","title":"Stress-testing medical large language models reveals latent safety pathology beyond benchmark accuracy"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.07929","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b577a7c093b91b83e8df5b3c9dc09e7cdda5f2b42a34625b61c1d76966042b23","target":"record","created_at":"2026-06-09T01:04:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"c80d69c98e980fe13798e6a04120911c4f97802557b6b7780b26295608c57de2","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-06-06T01:39:14Z","title_canon_sha256":"fb6b477441842e01ee1cdc191abfa7f1073329757ae20414c0fdfc2c992a5144"},"schema_version":"1.0","source":{"id":"2606.07929","kind":"arxiv","version":1}},"canonical_sha256":"da84b805984f80c29b1c4e8c9f7fd948fee2f905392e586c9d29c1d5903bcfb4","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"da84b805984f80c29b1c4e8c9f7fd948fee2f905392e586c9d29c1d5903bcfb4","first_computed_at":"2026-06-09T01:04:55.696739Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-09T01:04:55.696739Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"S5i5gbBfDQ0lbItqIg60jhF1geRtJzqLcU89BYePMuB7EHPbQ7ExSByVNSbol0q0CPj+C1ddz2nATQMf59rNCg==","signature_status":"signed_v1","signed_at":"2026-06-09T01:04:55.697137Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.07929","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b577a7c093b91b83e8df5b3c9dc09e7cdda5f2b42a34625b61c1d76966042b23","sha256:afc6f96c32766f640c80c9c11b0e97709d41ffb1c03ae891cb758f3b31f3893a"],"state_sha256":"e170089ad74986bf4dda7dd6b69068e3e1292b87fdfd2f6548cea9cd1f0df925"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"SgQ8RS2h1osnHvPPqI5TaszyX/LIXUbEeEpujhp/5grFwnUiNFV2Fi8bVXoPvUbWmBIA/VnDk46+ufe/BBQCBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-04T15:26:21.601798Z","bundle_sha256":"703f87d0162c6aeea7bee0999847086782a321b1023a5ca849a27b3397d6e56f"}}