{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:AWVDMIX6SMDOJINH6GLWPXG2OA","short_pith_number":"pith:AWVDMIX6","schema_version":"1.0","canonical_sha256":"05aa3622fe9306e4a1a7f19767dcda7029fb7eca393e78b3ac92918c808ce36a","source":{"kind":"arxiv","id":"2606.01164","version":1},"attestation_state":"computed","paper":{"title":"Towards Interactive Video World Modeling: Frontiers, Challenges, Benchmarks, and Future Trends","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Ayush Tewari, Chaojun Ni, Chensheng Peng, Fangjinhua Wang, Jiuming Liu, Marc Pollefeys, Masayoshi Tomizuka, Mengmeng Liu, Per Ola Kristensson, Sitian Shen","submitted_at":"2026-05-31T11:12:30Z","abstract_excerpt":"With rapid development of large language models and diffusion-based content generation, world modeling has attracted increasing research attention, benefiting various downstream domains such as game engines, embodied AI, autonomous driving, etc. Through explicitly incorporating user actions into world state transition, recent literature empowers world modeling with interactivity in an action-conditioned video or 3D generation paradigm, further enhancing controllability over world evolutions and facilitating users to freely traverse, manipulate, navigate, and personalize the state evolution. In"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2606.01164","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-05-31T11:12:30Z","cross_cats_sorted":[],"title_canon_sha256":"56cc45477f19494754e73508715dce8e99c18556164ffbc2af468e1763f4abb1","abstract_canon_sha256":"ff8ed6deca0e4aced49cfa25a250d026ffc4650ef2879c78bf1093626e317c5b"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-02T02:04:25.506268Z","signature_b64":"MIfMns0YfY8N+SZutJ56d80vnET5Hcc0yNDA6G+ZKlx07qVrGzC/Lk4s5Vl4fBmplYp//RwZ+qcAzj4ThtefBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"05aa3622fe9306e4a1a7f19767dcda7029fb7eca393e78b3ac92918c808ce36a","last_reissued_at":"2026-06-02T02:04:25.505882Z","signature_status":"signed_v1","first_computed_at":"2026-06-02T02:04:25.505882Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Towards Interactive Video World Modeling: Frontiers, Challenges, Benchmarks, and Future Trends","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Ayush Tewari, Chaojun Ni, Chensheng Peng, Fangjinhua Wang, Jiuming Liu, Marc Pollefeys, Masayoshi Tomizuka, Mengmeng Liu, Per Ola Kristensson, Sitian Shen","submitted_at":"2026-05-31T11:12:30Z","abstract_excerpt":"With rapid development of large language models and diffusion-based content generation, world modeling has attracted increasing research attention, benefiting various downstream domains such as game engines, embodied AI, autonomous driving, etc. Through explicitly incorporating user actions into world state transition, recent literature empowers world modeling with interactivity in an action-conditioned video or 3D generation paradigm, further enhancing controllability over world evolutions and facilitating users to freely traverse, manipulate, navigate, and personalize the state evolution. In"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.01164","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.01164/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2606.01164","created_at":"2026-06-02T02:04:25.505946+00:00"},{"alias_kind":"arxiv_version","alias_value":"2606.01164v1","created_at":"2026-06-02T02:04:25.505946+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.01164","created_at":"2026-06-02T02:04:25.505946+00:00"},{"alias_kind":"pith_short_12","alias_value":"AWVDMIX6SMDO","created_at":"2026-06-02T02:04:25.505946+00:00"},{"alias_kind":"pith_short_16","alias_value":"AWVDMIX6SMDOJINH","created_at":"2026-06-02T02:04:25.505946+00:00"},{"alias_kind":"pith_short_8","alias_value":"AWVDMIX6","created_at":"2026-06-02T02:04:25.505946+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/AWVDMIX6SMDOJINH6GLWPXG2OA","json":"https://pith.science/pith/AWVDMIX6SMDOJINH6GLWPXG2OA.json","graph_json":"https://pith.science/api/pith-number/AWVDMIX6SMDOJINH6GLWPXG2OA/graph.json","events_json":"https://pith.science/api/pith-number/AWVDMIX6SMDOJINH6GLWPXG2OA/events.json","paper":"https://pith.science/paper/AWVDMIX6"},"agent_actions":{"view_html":"https://pith.science/pith/AWVDMIX6SMDOJINH6GLWPXG2OA","download_json":"https://pith.science/pith/AWVDMIX6SMDOJINH6GLWPXG2OA.json","view_paper":"https://pith.science/paper/AWVDMIX6","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2606.01164&json=true","fetch_graph":"https://pith.science/api/pith-number/AWVDMIX6SMDOJINH6GLWPXG2OA/graph.json","fetch_events":"https://pith.science/api/pith-number/AWVDMIX6SMDOJINH6GLWPXG2OA/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/AWVDMIX6SMDOJINH6GLWPXG2OA/action/timestamp_anchor","attest_storage":"https://pith.science/pith/AWVDMIX6SMDOJINH6GLWPXG2OA/action/storage_attestation","attest_author":"https://pith.science/pith/AWVDMIX6SMDOJINH6GLWPXG2OA/action/author_attestation","sign_citation":"https://pith.science/pith/AWVDMIX6SMDOJINH6GLWPXG2OA/action/citation_signature","submit_replication":"https://pith.science/pith/AWVDMIX6SMDOJINH6GLWPXG2OA/action/replication_record"}},"created_at":"2026-06-02T02:04:25.505946+00:00","updated_at":"2026-06-02T02:04:25.505946+00:00"}