{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:YPXVKQQJR4Q5TYPTDXJ2G3LCMP","short_pith_number":"pith:YPXVKQQJ","canonical_record":{"source":{"id":"2606.24460","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-23T11:47:03Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"86f485a2006769baeb929a5e194f5d7caa5295c76e9152b48f5901562e7ce016","abstract_canon_sha256":"6e7d6487bdb21ab238eb94b3a6093250fa1164ec86b2f0461abfa4ec4acadbb7"},"schema_version":"1.0"},"canonical_sha256":"c3ef5542098f21d9e1f31dd3a36d6263f954b6e9229c52f3e5a232ec2ec50aec","source":{"kind":"arxiv","id":"2606.24460","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.24460","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"arxiv_version","alias_value":"2606.24460v1","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.24460","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"pith_short_12","alias_value":"YPXVKQQJR4Q5","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"pith_short_16","alias_value":"YPXVKQQJR4Q5TYPT","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"pith_short_8","alias_value":"YPXVKQQJ","created_at":"2026-06-24T01:15:31Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:YPXVKQQJR4Q5TYPTDXJ2G3LCMP","target":"record","payload":{"canonical_record":{"source":{"id":"2606.24460","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-23T11:47:03Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"86f485a2006769baeb929a5e194f5d7caa5295c76e9152b48f5901562e7ce016","abstract_canon_sha256":"6e7d6487bdb21ab238eb94b3a6093250fa1164ec86b2f0461abfa4ec4acadbb7"},"schema_version":"1.0"},"canonical_sha256":"c3ef5542098f21d9e1f31dd3a36d6263f954b6e9229c52f3e5a232ec2ec50aec","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-24T01:15:31.018350Z","signature_b64":"ROa9HSSvRJVb+Mxaea1sVjW+MmwmI5z9goUX8gqbxuVxmm+nAJJ6h0dhl8OpewmadyjWbGHqR/+uc4PPpvakAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c3ef5542098f21d9e1f31dd3a36d6263f954b6e9229c52f3e5a232ec2ec50aec","last_reissued_at":"2026-06-24T01:15:31.017993Z","signature_status":"signed_v1","first_computed_at":"2026-06-24T01:15:31.017993Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.24460","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-24T01:15:31Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"DVjbw6oeR2d0R0iaJ0djDsO+dJ8CAn0dVl4k+vwp8Jk5pscDszZk9SvxIM+8ruzlmsoMLQvUhIA2NpW+H5NbDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-29T15:42:14.032513Z"},"content_sha256":"4c2a7e29295678677d97ff37a8ea50049c0528f7ed20c28075ec197f1a69e3f1","schema_version":"1.0","event_id":"sha256:4c2a7e29295678677d97ff37a8ea50049c0528f7ed20c28075ec197f1a69e3f1"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:YPXVKQQJR4Q5TYPTDXJ2G3LCMP","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"The African Language Tax: Quantifying the Cost, Latency, and Context Penalty of Tokenizing African Languages in Frontier LLMs","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CL","authors_text":"Olaoye Anthony Somide","submitted_at":"2026-06-23T11:47:03Z","abstract_excerpt":"Commercial large language models bill, scale latency, and budget context per token. Yet tokenizers assign more subword tokens to the same meaning in some languages than in others, so speakers of languages with high token-fertility pay a structural penalty before a model is ever invoked. This penalty is documented for multilingual settings in general, but it has not been measured systematically for African languages at the level of enterprise deployment economics and cognitive context capacity. We measure it across 20 African languages spanning five language families and three scripts (Latin, G"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.24460","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.24460/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-24T01:15:31Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ppnsEYpCCPBCYqCXpIDGeo8XZiFaOHqzYZHfGShgJJvLcdJUaAD+9gkJ0Y2b1BnmGn5mJO5twvt2B63REM9iDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-29T15:42:14.032881Z"},"content_sha256":"128e4136a349983c0d7f7f5d60849ecfb8123e7c9d037e5c5869645e3c04b44f","schema_version":"1.0","event_id":"sha256:128e4136a349983c0d7f7f5d60849ecfb8123e7c9d037e5c5869645e3c04b44f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/YPXVKQQJR4Q5TYPTDXJ2G3LCMP/bundle.json","state_url":"https://pith.science/pith/YPXVKQQJR4Q5TYPTDXJ2G3LCMP/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/YPXVKQQJR4Q5TYPTDXJ2G3LCMP/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-29T15:42:14Z","links":{"resolver":"https://pith.science/pith/YPXVKQQJR4Q5TYPTDXJ2G3LCMP","bundle":"https://pith.science/pith/YPXVKQQJR4Q5TYPTDXJ2G3LCMP/bundle.json","state":"https://pith.science/pith/YPXVKQQJR4Q5TYPTDXJ2G3LCMP/state.json","well_known_bundle":"https://pith.science/.well-known/pith/YPXVKQQJR4Q5TYPTDXJ2G3LCMP/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:YPXVKQQJR4Q5TYPTDXJ2G3LCMP","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"6e7d6487bdb21ab238eb94b3a6093250fa1164ec86b2f0461abfa4ec4acadbb7","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-23T11:47:03Z","title_canon_sha256":"86f485a2006769baeb929a5e194f5d7caa5295c76e9152b48f5901562e7ce016"},"schema_version":"1.0","source":{"id":"2606.24460","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.24460","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"arxiv_version","alias_value":"2606.24460v1","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.24460","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"pith_short_12","alias_value":"YPXVKQQJR4Q5","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"pith_short_16","alias_value":"YPXVKQQJR4Q5TYPT","created_at":"2026-06-24T01:15:31Z"},{"alias_kind":"pith_short_8","alias_value":"YPXVKQQJ","created_at":"2026-06-24T01:15:31Z"}],"graph_snapshots":[{"event_id":"sha256:128e4136a349983c0d7f7f5d60849ecfb8123e7c9d037e5c5869645e3c04b44f","target":"graph","created_at":"2026-06-24T01:15:31Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.24460/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Commercial large language models bill, scale latency, and budget context per token. Yet tokenizers assign more subword tokens to the same meaning in some languages than in others, so speakers of languages with high token-fertility pay a structural penalty before a model is ever invoked. This penalty is documented for multilingual settings in general, but it has not been measured systematically for African languages at the level of enterprise deployment economics and cognitive context capacity. We measure it across 20 African languages spanning five language families and three scripts (Latin, G","authors_text":"Olaoye Anthony Somide","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-23T11:47:03Z","title":"The African Language Tax: Quantifying the Cost, Latency, and Context Penalty of Tokenizing African Languages in Frontier LLMs"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.24460","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:4c2a7e29295678677d97ff37a8ea50049c0528f7ed20c28075ec197f1a69e3f1","target":"record","created_at":"2026-06-24T01:15:31Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"6e7d6487bdb21ab238eb94b3a6093250fa1164ec86b2f0461abfa4ec4acadbb7","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-23T11:47:03Z","title_canon_sha256":"86f485a2006769baeb929a5e194f5d7caa5295c76e9152b48f5901562e7ce016"},"schema_version":"1.0","source":{"id":"2606.24460","kind":"arxiv","version":1}},"canonical_sha256":"c3ef5542098f21d9e1f31dd3a36d6263f954b6e9229c52f3e5a232ec2ec50aec","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c3ef5542098f21d9e1f31dd3a36d6263f954b6e9229c52f3e5a232ec2ec50aec","first_computed_at":"2026-06-24T01:15:31.017993Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-24T01:15:31.017993Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"ROa9HSSvRJVb+Mxaea1sVjW+MmwmI5z9goUX8gqbxuVxmm+nAJJ6h0dhl8OpewmadyjWbGHqR/+uc4PPpvakAg==","signature_status":"signed_v1","signed_at":"2026-06-24T01:15:31.018350Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.24460","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:4c2a7e29295678677d97ff37a8ea50049c0528f7ed20c28075ec197f1a69e3f1","sha256:128e4136a349983c0d7f7f5d60849ecfb8123e7c9d037e5c5869645e3c04b44f"],"state_sha256":"38d70735ef065708644674326f6c26a2f95942fc83bd11c74e2c1861129a3df3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Ex6m0qGVARy1skK68mLynx0DE9nj7ggzObNABMYuo2rR453xrk2s/fnAJUmZ639bzcRErjLSfgDt9WmyMhulCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-29T15:42:14.035514Z","bundle_sha256":"beed94f69ef648058fb6051ca4e84f1e888d008af4c16935955c47f9db08cb55"}}