{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:6HLSDA2EP3CGYUF35K76FKCEZN","short_pith_number":"pith:6HLSDA2E","canonical_record":{"source":{"id":"1810.13033","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-10-30T23:31:50Z","cross_cats_sorted":[],"title_canon_sha256":"83d9e555fcf9f2c97450e9a67e6b73dcd161b1877cb28e4dbb7760ec5c4e6da9","abstract_canon_sha256":"5da7c01b2cd4bdde651c947c119257d3ff440b96d4be24c103295d7ab72a8a1c"},"schema_version":"1.0"},"canonical_sha256":"f1d72183447ec46c50bbeabfe2a844cb6830c32416141c67da10bf2e1167b2bf","source":{"kind":"arxiv","id":"1810.13033","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1810.13033","created_at":"2026-05-18T00:01:52Z"},{"alias_kind":"arxiv_version","alias_value":"1810.13033v1","created_at":"2026-05-18T00:01:52Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1810.13033","created_at":"2026-05-18T00:01:52Z"},{"alias_kind":"pith_short_12","alias_value":"6HLSDA2EP3CG","created_at":"2026-05-18T12:32:08Z"},{"alias_kind":"pith_short_16","alias_value":"6HLSDA2EP3CGYUF3","created_at":"2026-05-18T12:32:08Z"},{"alias_kind":"pith_short_8","alias_value":"6HLSDA2E","created_at":"2026-05-18T12:32:08Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:6HLSDA2EP3CGYUF35K76FKCEZN","target":"record","payload":{"canonical_record":{"source":{"id":"1810.13033","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-10-30T23:31:50Z","cross_cats_sorted":[],"title_canon_sha256":"83d9e555fcf9f2c97450e9a67e6b73dcd161b1877cb28e4dbb7760ec5c4e6da9","abstract_canon_sha256":"5da7c01b2cd4bdde651c947c119257d3ff440b96d4be24c103295d7ab72a8a1c"},"schema_version":"1.0"},"canonical_sha256":"f1d72183447ec46c50bbeabfe2a844cb6830c32416141c67da10bf2e1167b2bf","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:01:52.425610Z","signature_b64":"WqjNyrj8fhncw+Nw0/0hmRGkwT/kR9pFt9jLCBQJ+PvYJL0OGK0ODj6dNK5qD3vjfE7MBOdQPTO8h+QDL8NgAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f1d72183447ec46c50bbeabfe2a844cb6830c32416141c67da10bf2e1167b2bf","last_reissued_at":"2026-05-18T00:01:52.425011Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:01:52.425011Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1810.13033","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:01:52Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"WKlopVG0p3vYMQ6eYidGIzyIaAkQ+huGFejIKXjmfk5WBDCtlk6sFL94tBZpl4Ir4bl3I/rPXgvAXkluwECfCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T20:11:56.382140Z"},"content_sha256":"470ec1f93c06445cba08ccd9e4b784c88b34ef048dcab0687d295269b695324a","schema_version":"1.0","event_id":"sha256:470ec1f93c06445cba08ccd9e4b784c88b34ef048dcab0687d295269b695324a"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:6HLSDA2EP3CGYUF35K76FKCEZN","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Stress-Testing Neural Models of Natural Language Inference with Multiply-Quantified Sentences","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Atticus Geiger, Christopher Potts, Ignacio Cases, Lauri Karttunen","submitted_at":"2018-10-30T23:31:50Z","abstract_excerpt":"Standard evaluations of deep learning models for semantics using naturalistic corpora are limited in what they can tell us about the fidelity of the learned representations, because the corpora rarely come with good measures of semantic complexity. To overcome this limitation, we present a method for generating data sets of multiply-quantified natural language inference (NLI) examples in which semantic complexity can be precisely characterized, and we use this method to show that a variety of common architectures for NLI inevitably fail to encode crucial information; only a model with forced l"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1810.13033","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:01:52Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"T9q0HEq8DGIo49lh8SkqWXSnshRYxBSe6y+x9Z8+XpzSm37CS6nyjhSMbhPs2mxWqWlx0yNm82Wq2Q3dcG/KAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T20:11:56.382510Z"},"content_sha256":"4170a029a3bcb0bef311dc01d1cbfb3f072dd08659a6f5113e3f37fa84c66e1c","schema_version":"1.0","event_id":"sha256:4170a029a3bcb0bef311dc01d1cbfb3f072dd08659a6f5113e3f37fa84c66e1c"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/6HLSDA2EP3CGYUF35K76FKCEZN/bundle.json","state_url":"https://pith.science/pith/6HLSDA2EP3CGYUF35K76FKCEZN/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/6HLSDA2EP3CGYUF35K76FKCEZN/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-04T20:11:56Z","links":{"resolver":"https://pith.science/pith/6HLSDA2EP3CGYUF35K76FKCEZN","bundle":"https://pith.science/pith/6HLSDA2EP3CGYUF35K76FKCEZN/bundle.json","state":"https://pith.science/pith/6HLSDA2EP3CGYUF35K76FKCEZN/state.json","well_known_bundle":"https://pith.science/.well-known/pith/6HLSDA2EP3CGYUF35K76FKCEZN/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:6HLSDA2EP3CGYUF35K76FKCEZN","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5da7c01b2cd4bdde651c947c119257d3ff440b96d4be24c103295d7ab72a8a1c","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-10-30T23:31:50Z","title_canon_sha256":"83d9e555fcf9f2c97450e9a67e6b73dcd161b1877cb28e4dbb7760ec5c4e6da9"},"schema_version":"1.0","source":{"id":"1810.13033","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1810.13033","created_at":"2026-05-18T00:01:52Z"},{"alias_kind":"arxiv_version","alias_value":"1810.13033v1","created_at":"2026-05-18T00:01:52Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1810.13033","created_at":"2026-05-18T00:01:52Z"},{"alias_kind":"pith_short_12","alias_value":"6HLSDA2EP3CG","created_at":"2026-05-18T12:32:08Z"},{"alias_kind":"pith_short_16","alias_value":"6HLSDA2EP3CGYUF3","created_at":"2026-05-18T12:32:08Z"},{"alias_kind":"pith_short_8","alias_value":"6HLSDA2E","created_at":"2026-05-18T12:32:08Z"}],"graph_snapshots":[{"event_id":"sha256:4170a029a3bcb0bef311dc01d1cbfb3f072dd08659a6f5113e3f37fa84c66e1c","target":"graph","created_at":"2026-05-18T00:01:52Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Standard evaluations of deep learning models for semantics using naturalistic corpora are limited in what they can tell us about the fidelity of the learned representations, because the corpora rarely come with good measures of semantic complexity. To overcome this limitation, we present a method for generating data sets of multiply-quantified natural language inference (NLI) examples in which semantic complexity can be precisely characterized, and we use this method to show that a variety of common architectures for NLI inevitably fail to encode crucial information; only a model with forced l","authors_text":"Atticus Geiger, Christopher Potts, Ignacio Cases, Lauri Karttunen","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-10-30T23:31:50Z","title":"Stress-Testing Neural Models of Natural Language Inference with Multiply-Quantified Sentences"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1810.13033","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:470ec1f93c06445cba08ccd9e4b784c88b34ef048dcab0687d295269b695324a","target":"record","created_at":"2026-05-18T00:01:52Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5da7c01b2cd4bdde651c947c119257d3ff440b96d4be24c103295d7ab72a8a1c","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-10-30T23:31:50Z","title_canon_sha256":"83d9e555fcf9f2c97450e9a67e6b73dcd161b1877cb28e4dbb7760ec5c4e6da9"},"schema_version":"1.0","source":{"id":"1810.13033","kind":"arxiv","version":1}},"canonical_sha256":"f1d72183447ec46c50bbeabfe2a844cb6830c32416141c67da10bf2e1167b2bf","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f1d72183447ec46c50bbeabfe2a844cb6830c32416141c67da10bf2e1167b2bf","first_computed_at":"2026-05-18T00:01:52.425011Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:01:52.425011Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"WqjNyrj8fhncw+Nw0/0hmRGkwT/kR9pFt9jLCBQJ+PvYJL0OGK0ODj6dNK5qD3vjfE7MBOdQPTO8h+QDL8NgAg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:01:52.425610Z","signed_message":"canonical_sha256_bytes"},"source_id":"1810.13033","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:470ec1f93c06445cba08ccd9e4b784c88b34ef048dcab0687d295269b695324a","sha256:4170a029a3bcb0bef311dc01d1cbfb3f072dd08659a6f5113e3f37fa84c66e1c"],"state_sha256":"b76fa94fa7df8dda0960038a6b5e06cee90292dfac99877c16aea4cb48f9a296"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2UUZrG9ZMVyDoF9Hw8cVykzF+xFPoQVtq1m054vVfseAN8qTJA0RgQPbBKSlD9UBARFun6Jk7WpLLMuHZjoSCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-04T20:11:56.384761Z","bundle_sha256":"a86804b459b0fd2a52b2a5ad7d7c583ccf0fb6e6b8900380693796e17628ed76"}}