{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:44HEIP6H6IRUNCSS2F4THWFOHD","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a94f677f02fb33aa4fdd875117617664b2a4caec6181cfc36c3befaabf89efa7","cross_cats_sorted":["cs.CR","cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-28T16:18:07Z","title_canon_sha256":"289a2b8101c4ecc460f22eb18690a494b4a2dc039687e06bde148872fe253972"},"schema_version":"1.0","source":{"id":"2605.30162","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.30162","created_at":"2026-05-29T02:06:11Z"},{"alias_kind":"arxiv_version","alias_value":"2605.30162v1","created_at":"2026-05-29T02:06:11Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.30162","created_at":"2026-05-29T02:06:11Z"},{"alias_kind":"pith_short_12","alias_value":"44HEIP6H6IRU","created_at":"2026-05-29T02:06:11Z"},{"alias_kind":"pith_short_16","alias_value":"44HEIP6H6IRUNCSS","created_at":"2026-05-29T02:06:11Z"},{"alias_kind":"pith_short_8","alias_value":"44HEIP6H","created_at":"2026-05-29T02:06:11Z"}],"graph_snapshots":[{"event_id":"sha256:24a226e569941bdb5dba034740ca8ced788806a28003e269964d5a5c4e3c6173","target":"graph","created_at":"2026-05-29T02:06:11Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.30162/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Biosecurity evaluations of language models typically ask whether models produce hazardous output. This paper asks a complementary question: when a model refuses, is that refusal structurally sound, or does it disappear under modest changes to prompt framing, formatting, or output length? Across five architectures, no model cleanly discriminated benign from hazard. Gemma 2 2B-IT never genuinely refused across 75 prompts, hedging on every hazard-adjacent query. Gemma 4 E2B-IT refused 65/75 prompts with chat-template formatting and 0/75 without it. Both Gemma models collapsed to 0% under an 80-to","authors_text":"Caleb DeLeeuw","cross_cats":["cs.CR","cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-28T16:18:07Z","title":"BioRefusalAudit: Auditing Biosecurity Refusal Depth Using General and Domain-Fine-Tuned Sparse Autoencoders"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.30162","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:e6a62e7783461750a6d147587cb63cfb68889ee21d32187b01b9de30d21552b7","target":"record","created_at":"2026-05-29T02:06:11Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a94f677f02fb33aa4fdd875117617664b2a4caec6181cfc36c3befaabf89efa7","cross_cats_sorted":["cs.CR","cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-28T16:18:07Z","title_canon_sha256":"289a2b8101c4ecc460f22eb18690a494b4a2dc039687e06bde148872fe253972"},"schema_version":"1.0","source":{"id":"2605.30162","kind":"arxiv","version":1}},"canonical_sha256":"e70e443fc7f223468a52d17933d8ae38c1f4109942406f14d4962ce0fc1f8068","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e70e443fc7f223468a52d17933d8ae38c1f4109942406f14d4962ce0fc1f8068","first_computed_at":"2026-05-29T02:06:11.442153Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-29T02:06:11.442153Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"iP23VI5yRvWawqjezrlMWmPhp50X4UL83iAftIkuLP0KAbps/RZz73WJsTRP+M4RodpGhGHU4CxMzZz0cMwjDg==","signature_status":"signed_v1","signed_at":"2026-05-29T02:06:11.442556Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.30162","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:e6a62e7783461750a6d147587cb63cfb68889ee21d32187b01b9de30d21552b7","sha256:24a226e569941bdb5dba034740ca8ced788806a28003e269964d5a5c4e3c6173"],"state_sha256":"2ca7b5470a9a05174983345fb916f575bde51ffee791e7c7e639bd11cacbb185"}