{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:JFVI2FV2KCVXMO52HS2MTWQVOG","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"f5b3a5175e07972709125aafc1e437ff761197f414a8fa0d34ff57d1ba239d12","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T06:56:53Z","title_canon_sha256":"03af7affd16b6efc9d6d76b6e9aa0436e6c8531e8f941733939d182bc6ec332e"},"schema_version":"1.0","source":{"id":"2605.14461","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.14461","created_at":"2026-05-17T23:39:06Z"},{"alias_kind":"arxiv_version","alias_value":"2605.14461v1","created_at":"2026-05-17T23:39:06Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.14461","created_at":"2026-05-17T23:39:06Z"},{"alias_kind":"pith_short_12","alias_value":"JFVI2FV2KCVX","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"JFVI2FV2KCVXMO52","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"JFVI2FV2","created_at":"2026-05-18T12:33:37Z"}],"graph_snapshots":[{"event_id":"sha256:e4785a39db275f67fff89584a4b77b59b4bf2610515089c0f7c6af4bd029d1b3","target":"graph","created_at":"2026-05-17T23:39:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"ClickRemoval localizes target objects and restores the background through self-attention modulation during denoising without additional training, hand-drawn masks, or text descriptions, achieving competitive results across quantitative metrics and user studies."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"That user clicks alone, combined with self-attention modulation in a pretrained Stable Diffusion model, are sufficient to accurately localize objects and produce natural background completions in complex scenes."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"ClickRemoval delivers click-driven object removal and background restoration in diffusion models through self-attention modulation without additional training or inputs."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"Clicks alone let users remove objects from images in pretrained diffusion models"}],"snapshot_sha256":"870d9af08fee772987712d274b31fdafe7ba6f975cf91bb75c7a8b5064492bbc"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Existing object removal tools often rely on manual masks or text prompts, making precise removal difficult for non-expert users in complex scenes and often leading to incomplete removal or unnatural background completion. To address this issue, we present ClickRemoval, an open-source interactive object removal tool built on pretrained Stable Diffusion models and driven solely by user clicks. Without additional training, hand-drawn masks, or text descriptions, ClickRemoval localizes target objects and restores the background through self-attention modulation during denoising. Experiments show t","authors_text":"Ledun Zhang, Xinying Yao, Xufei Zhuang, Yatu Ji","cross_cats":[],"headline":"Clicks alone let users remove objects from images in pretrained diffusion models","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T06:56:53Z","title":"ClickRemoval: An Interactive Open-Source Tool for Object Removal in Diffusion Models"},"references":{"count":15,"internal_anchors":0,"resolved_work":15,"sample":[{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":1,"title":"Aditya Chandrasekar, Goirik Chakrabarty, Jai Bardhan, Ramya Hebbalaguppe, and Prathosh AP. 2024. Remove: A reference-free metric for object erasure. InPro- ceedings of the IEEE/CVF Conference on Compu","work_id":"142283c7-6131-42ba-bd0c-904cc7032508","year":2024},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":2,"title":"Nima Fathi, Amar Kumar, and Tal Arbel. 2025. Aura: A multi-modal medical agent for understanding, reasoning and annotation. InInternational Workshop on Agentic AI for Medicine. 105–114","work_id":"6d1b0e57-1367-48e5-a973-7ce0dda59672","year":2025},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":3,"title":"Tariq Berrada Ifriqi, Adriana Romero-Soriano, Michal Drozdzal, Jakob Verbeek, and Karteek Alahari. 2025. Entropy Rectifying Guidance for Diffusion and Flow Models. InNeurIPS 2025-Thirty-ninth Conferen","work_id":"5fa38a74-a531-4809-8028-57a347b870a8","year":2025},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":4,"title":"Xuan Ju, Xian Liu, Xintao Wang, Yuxuan Bian, Ying Shan, and Qiang Xu. 2024. Brushnet: A plug-and-play image inpainting model with decomposed dual- branch diffusion. InEuropean Conference on Computer V","work_id":"84fd47ed-f9ff-462b-b1ef-3e85422662af","year":2024},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":5,"title":"Markus Karmann and Onay Urfalioglu. 2025. Repurposing stable diffusion attention for training-free unsupervised interactive segmentation. InProceedings of the Computer Vision and Pattern Recognition C","work_id":"9b4198be-ddba-4818-bef6-7dd84e3edb02","year":2025}],"snapshot_sha256":"a7125be0ef49186b070aa97230f10c53d7ea48d1fccfdb8e6413570f5e4c34dc"},"source":{"id":"2605.14461","kind":"arxiv","version":1},"verdict":{"created_at":"2026-05-15T02:44:52.808238Z","id":"deeaec04-eef5-47b2-bbd3-1e3816176e42","model_set":{"reader":"grok-4.3"},"one_line_summary":"ClickRemoval delivers click-driven object removal and background restoration in diffusion models through self-attention modulation without additional training or inputs.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"Clicks alone let users remove objects from images in pretrained diffusion models","strongest_claim":"ClickRemoval localizes target objects and restores the background through self-attention modulation during denoising without additional training, hand-drawn masks, or text descriptions, achieving competitive results across quantitative metrics and user studies.","weakest_assumption":"That user clicks alone, combined with self-attention modulation in a pretrained Stable Diffusion model, are sufficient to accurately localize objects and produce natural background completions in complex scenes."}},"verdict_id":"deeaec04-eef5-47b2-bbd3-1e3816176e42"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b13280d76b3de7e01599d50b974fa3e4d5924475f81e2785b02db4695be82a29","target":"record","created_at":"2026-05-17T23:39:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"f5b3a5175e07972709125aafc1e437ff761197f414a8fa0d34ff57d1ba239d12","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T06:56:53Z","title_canon_sha256":"03af7affd16b6efc9d6d76b6e9aa0436e6c8531e8f941733939d182bc6ec332e"},"schema_version":"1.0","source":{"id":"2605.14461","kind":"arxiv","version":1}},"canonical_sha256":"496a8d16ba50ab763bba3cb4c9da1571979ac47824c86f0b8b5117958e9c46f2","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"496a8d16ba50ab763bba3cb4c9da1571979ac47824c86f0b8b5117958e9c46f2","first_computed_at":"2026-05-17T23:39:06.776601Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:39:06.776601Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"knq/LVvevCriczCKVNFXeYst0BNh2x1BaKlcScSsjoE1Oka8ru5IG2yLyRsnNZ/X5ZYIimoTNo4GFr8zyihOCw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:39:06.777297Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.14461","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b13280d76b3de7e01599d50b974fa3e4d5924475f81e2785b02db4695be82a29","sha256:e4785a39db275f67fff89584a4b77b59b4bf2610515089c0f7c6af4bd029d1b3"],"state_sha256":"8c5f48dd1e675f010a9d7eb20f365fb18ecf3882a2a28140219c6f0f9226badd"}