{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:BZL4LUJIAY6TJJNCWX32TZNE4H","short_pith_number":"pith:BZL4LUJI","schema_version":"1.0","canonical_sha256":"0e57c5d128063d34a5a2b5f7a9e5a4e1e4c9e88a64118890aeb707745d9b9ba3","source":{"kind":"arxiv","id":"2606.04484","version":1},"attestation_state":"computed","paper":{"title":"AgentJet: A Flexible Swarm Training Framework for Agentic Reinforcement Learning","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.LG","cs.MA"],"primary_cat":"cs.AI","authors_text":"Bolin Ding, Boyin Liu, Qingxu Fu, Shuchang Tao, Zhaoyang Liu","submitted_at":"2026-06-03T06:02:52Z","abstract_excerpt":"We present AgentJet, a distributed swarm training framework for large language model (LLM) agent reinforcement learning. Unlike centralized frameworks that tightly couple agent rollouts with model optimization, AgentJet adopts a decoupled multi-node architecture in which swarm server nodes host trainable models and run optimization on GPU clusters, whereas swarm client nodes execute arbitrary agents on arbitrary devices. This design provides capabilities that are difficult to support in centralized frameworks: (1) heterogeneous multi-model reinforcement learning, enabling the training of heter"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2606.04484","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-06-03T06:02:52Z","cross_cats_sorted":["cs.LG","cs.MA"],"title_canon_sha256":"2f8e03312713f2b6fe84c23ff44d424c2d4ce1789fd423c0f4ed589a18ce103b","abstract_canon_sha256":"7b5593e323ab149c223f6a4821f160547b6b3538a3ae05b9d65bae57b803c4d5"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-04T01:09:10.033529Z","signature_b64":"+QIgFPkE1JGmx1e2BlAddDTtL9o8pt3LMMJvzuU/L3kLBQNsKxNX1/sNKpevGgx3T/fw1RAA81dvsPAJge5ACg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"0e57c5d128063d34a5a2b5f7a9e5a4e1e4c9e88a64118890aeb707745d9b9ba3","last_reissued_at":"2026-06-04T01:09:10.033093Z","signature_status":"signed_v1","first_computed_at":"2026-06-04T01:09:10.033093Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"AgentJet: A Flexible Swarm Training Framework for Agentic Reinforcement Learning","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.LG","cs.MA"],"primary_cat":"cs.AI","authors_text":"Bolin Ding, Boyin Liu, Qingxu Fu, Shuchang Tao, Zhaoyang Liu","submitted_at":"2026-06-03T06:02:52Z","abstract_excerpt":"We present AgentJet, a distributed swarm training framework for large language model (LLM) agent reinforcement learning. Unlike centralized frameworks that tightly couple agent rollouts with model optimization, AgentJet adopts a decoupled multi-node architecture in which swarm server nodes host trainable models and run optimization on GPU clusters, whereas swarm client nodes execute arbitrary agents on arbitrary devices. This design provides capabilities that are difficult to support in centralized frameworks: (1) heterogeneous multi-model reinforcement learning, enabling the training of heter"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.04484","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.04484/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2606.04484","created_at":"2026-06-04T01:09:10.033155+00:00"},{"alias_kind":"arxiv_version","alias_value":"2606.04484v1","created_at":"2026-06-04T01:09:10.033155+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.04484","created_at":"2026-06-04T01:09:10.033155+00:00"},{"alias_kind":"pith_short_12","alias_value":"BZL4LUJIAY6T","created_at":"2026-06-04T01:09:10.033155+00:00"},{"alias_kind":"pith_short_16","alias_value":"BZL4LUJIAY6TJJNC","created_at":"2026-06-04T01:09:10.033155+00:00"},{"alias_kind":"pith_short_8","alias_value":"BZL4LUJI","created_at":"2026-06-04T01:09:10.033155+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/BZL4LUJIAY6TJJNCWX32TZNE4H","json":"https://pith.science/pith/BZL4LUJIAY6TJJNCWX32TZNE4H.json","graph_json":"https://pith.science/api/pith-number/BZL4LUJIAY6TJJNCWX32TZNE4H/graph.json","events_json":"https://pith.science/api/pith-number/BZL4LUJIAY6TJJNCWX32TZNE4H/events.json","paper":"https://pith.science/paper/BZL4LUJI"},"agent_actions":{"view_html":"https://pith.science/pith/BZL4LUJIAY6TJJNCWX32TZNE4H","download_json":"https://pith.science/pith/BZL4LUJIAY6TJJNCWX32TZNE4H.json","view_paper":"https://pith.science/paper/BZL4LUJI","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2606.04484&json=true","fetch_graph":"https://pith.science/api/pith-number/BZL4LUJIAY6TJJNCWX32TZNE4H/graph.json","fetch_events":"https://pith.science/api/pith-number/BZL4LUJIAY6TJJNCWX32TZNE4H/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/BZL4LUJIAY6TJJNCWX32TZNE4H/action/timestamp_anchor","attest_storage":"https://pith.science/pith/BZL4LUJIAY6TJJNCWX32TZNE4H/action/storage_attestation","attest_author":"https://pith.science/pith/BZL4LUJIAY6TJJNCWX32TZNE4H/action/author_attestation","sign_citation":"https://pith.science/pith/BZL4LUJIAY6TJJNCWX32TZNE4H/action/citation_signature","submit_replication":"https://pith.science/pith/BZL4LUJIAY6TJJNCWX32TZNE4H/action/replication_record"}},"created_at":"2026-06-04T01:09:10.033155+00:00","updated_at":"2026-06-04T01:09:10.033155+00:00"}