{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2021:NMB7QKC2NJYNHLPG6XMF2N35IK","short_pith_number":"pith:NMB7QKC2","canonical_record":{"source":{"id":"2109.10465","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2021-09-22T00:57:46Z","cross_cats_sorted":["cs.AI","cs.LG"],"title_canon_sha256":"1081b2af858259c4909b86775021934b23d9342c1faf94b76a10c63484a84730","abstract_canon_sha256":"dcac02ae0b4559f7f4f48d8f5fa767bd4fe97a09a813604072a4c3e888cdbdad"},"schema_version":"1.0"},"canonical_sha256":"6b03f8285a6a70d3ade6f5d85d377d42a69898557b3236c98206a6751a356b42","source":{"kind":"arxiv","id":"2109.10465","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2109.10465","created_at":"2026-07-05T03:16:36Z"},{"alias_kind":"arxiv_version","alias_value":"2109.10465v1","created_at":"2026-07-05T03:16:36Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2109.10465","created_at":"2026-07-05T03:16:36Z"},{"alias_kind":"pith_short_12","alias_value":"NMB7QKC2NJYN","created_at":"2026-07-05T03:16:36Z"},{"alias_kind":"pith_short_16","alias_value":"NMB7QKC2NJYNHLPG","created_at":"2026-07-05T03:16:36Z"},{"alias_kind":"pith_short_8","alias_value":"NMB7QKC2","created_at":"2026-07-05T03:16:36Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2021:NMB7QKC2NJYNHLPG6XMF2N35IK","target":"record","payload":{"canonical_record":{"source":{"id":"2109.10465","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2021-09-22T00:57:46Z","cross_cats_sorted":["cs.AI","cs.LG"],"title_canon_sha256":"1081b2af858259c4909b86775021934b23d9342c1faf94b76a10c63484a84730","abstract_canon_sha256":"dcac02ae0b4559f7f4f48d8f5fa767bd4fe97a09a813604072a4c3e888cdbdad"},"schema_version":"1.0"},"canonical_sha256":"6b03f8285a6a70d3ade6f5d85d377d42a69898557b3236c98206a6751a356b42","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T03:16:36.497693Z","signature_b64":"9laqC697yEiudQfsgOXGMS9JdQ6p64rv25pgJF7NefPSl/e8AZRzyfN+UYwW705+vFIN3LktzSQEJXvfMrWlDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6b03f8285a6a70d3ade6f5d85d377d42a69898557b3236c98206a6751a356b42","last_reissued_at":"2026-07-05T03:16:36.497283Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T03:16:36.497283Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2109.10465","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T03:16:36Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"crqmplzZwQ7yCO8AYhegBwaW3aCOYdlU1h34N7B6QaTBEpidgnXeCHTHbk9CdtwruHl3fKqLGY4eBs9xCD8gCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T11:57:03.363225Z"},"content_sha256":"4e24036cab5089c306b45268a0a6214d7e8ee55e2c48d6d3e51d7de540eb6a38","schema_version":"1.0","event_id":"sha256:4e24036cab5089c306b45268a0a6214d7e8ee55e2c48d6d3e51d7de540eb6a38"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2021:NMB7QKC2NJYNHLPG6XMF2N35IK","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Scalable and Efficient MoE Training for Multitask Multilingual Models","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.LG"],"primary_cat":"cs.CL","authors_text":"Alexandre Muzio, Ammar Ahmad Awan, Amr Hendy, Andres Felipe Cruz Salinas, Hany Hassan Awadalla, Liyang Lu, Samyam Rajbhandari, Young Jin Kim, Yuxiong He","submitted_at":"2021-09-22T00:57:46Z","abstract_excerpt":"The Mixture of Experts (MoE) models are an emerging class of sparsely activated deep learning models that have sublinear compute costs with respect to their parameters. In contrast with dense models, the sparse architecture of MoE offers opportunities for drastically growing model size with significant accuracy gain while consuming much lower compute budget. However, supporting large scale MoE training also has its own set of system and modeling challenges. To overcome the challenges and embrace the opportunities of MoE, we first develop a system capable of scaling MoE models efficiently to tr"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2109.10465","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2109.10465/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T03:16:36Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"OSP8KQZ/hRnne1IkYI9lYBksnVhzffVlHiP8MQVGKFTYf3mdYJvRwbwSMbE8FPd3qkjcuOUWex2KORLQhiWIDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T11:57:03.363611Z"},"content_sha256":"f2166b73f361845d94a1db9a71e75960ff92313bb06820de99ae8a6a19e49e4a","schema_version":"1.0","event_id":"sha256:f2166b73f361845d94a1db9a71e75960ff92313bb06820de99ae8a6a19e49e4a"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/NMB7QKC2NJYNHLPG6XMF2N35IK/bundle.json","state_url":"https://pith.science/pith/NMB7QKC2NJYNHLPG6XMF2N35IK/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/NMB7QKC2NJYNHLPG6XMF2N35IK/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-05T11:57:03Z","links":{"resolver":"https://pith.science/pith/NMB7QKC2NJYNHLPG6XMF2N35IK","bundle":"https://pith.science/pith/NMB7QKC2NJYNHLPG6XMF2N35IK/bundle.json","state":"https://pith.science/pith/NMB7QKC2NJYNHLPG6XMF2N35IK/state.json","well_known_bundle":"https://pith.science/.well-known/pith/NMB7QKC2NJYNHLPG6XMF2N35IK/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2021:NMB7QKC2NJYNHLPG6XMF2N35IK","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"dcac02ae0b4559f7f4f48d8f5fa767bd4fe97a09a813604072a4c3e888cdbdad","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2021-09-22T00:57:46Z","title_canon_sha256":"1081b2af858259c4909b86775021934b23d9342c1faf94b76a10c63484a84730"},"schema_version":"1.0","source":{"id":"2109.10465","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2109.10465","created_at":"2026-07-05T03:16:36Z"},{"alias_kind":"arxiv_version","alias_value":"2109.10465v1","created_at":"2026-07-05T03:16:36Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2109.10465","created_at":"2026-07-05T03:16:36Z"},{"alias_kind":"pith_short_12","alias_value":"NMB7QKC2NJYN","created_at":"2026-07-05T03:16:36Z"},{"alias_kind":"pith_short_16","alias_value":"NMB7QKC2NJYNHLPG","created_at":"2026-07-05T03:16:36Z"},{"alias_kind":"pith_short_8","alias_value":"NMB7QKC2","created_at":"2026-07-05T03:16:36Z"}],"graph_snapshots":[{"event_id":"sha256:f2166b73f361845d94a1db9a71e75960ff92313bb06820de99ae8a6a19e49e4a","target":"graph","created_at":"2026-07-05T03:16:36Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2109.10465/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"The Mixture of Experts (MoE) models are an emerging class of sparsely activated deep learning models that have sublinear compute costs with respect to their parameters. In contrast with dense models, the sparse architecture of MoE offers opportunities for drastically growing model size with significant accuracy gain while consuming much lower compute budget. However, supporting large scale MoE training also has its own set of system and modeling challenges. To overcome the challenges and embrace the opportunities of MoE, we first develop a system capable of scaling MoE models efficiently to tr","authors_text":"Alexandre Muzio, Ammar Ahmad Awan, Amr Hendy, Andres Felipe Cruz Salinas, Hany Hassan Awadalla, Liyang Lu, Samyam Rajbhandari, Young Jin Kim, Yuxiong He","cross_cats":["cs.AI","cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2021-09-22T00:57:46Z","title":"Scalable and Efficient MoE Training for Multitask Multilingual Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2109.10465","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:4e24036cab5089c306b45268a0a6214d7e8ee55e2c48d6d3e51d7de540eb6a38","target":"record","created_at":"2026-07-05T03:16:36Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"dcac02ae0b4559f7f4f48d8f5fa767bd4fe97a09a813604072a4c3e888cdbdad","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2021-09-22T00:57:46Z","title_canon_sha256":"1081b2af858259c4909b86775021934b23d9342c1faf94b76a10c63484a84730"},"schema_version":"1.0","source":{"id":"2109.10465","kind":"arxiv","version":1}},"canonical_sha256":"6b03f8285a6a70d3ade6f5d85d377d42a69898557b3236c98206a6751a356b42","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"6b03f8285a6a70d3ade6f5d85d377d42a69898557b3236c98206a6751a356b42","first_computed_at":"2026-07-05T03:16:36.497283Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T03:16:36.497283Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"9laqC697yEiudQfsgOXGMS9JdQ6p64rv25pgJF7NefPSl/e8AZRzyfN+UYwW705+vFIN3LktzSQEJXvfMrWlDA==","signature_status":"signed_v1","signed_at":"2026-07-05T03:16:36.497693Z","signed_message":"canonical_sha256_bytes"},"source_id":"2109.10465","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:4e24036cab5089c306b45268a0a6214d7e8ee55e2c48d6d3e51d7de540eb6a38","sha256:f2166b73f361845d94a1db9a71e75960ff92313bb06820de99ae8a6a19e49e4a"],"state_sha256":"dd359e0012c9405a5d16bdbd19a480f8e9c6e1fbb40f044c353a228905fb523a"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Ym23zCAC1OTiO53pc36mbblxsxu6029v0KukU80ZuMt6CRd+UPGVZiyzwqGXINFZZlP0A+sQH+euBM9J9bezBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-05T11:57:03.365626Z","bundle_sha256":"aa85e46b53c580255bc554eaeeac07c091612b4e3a0662ac004c4aeccf6333a5"}}