{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2011:34C7JOXCDK3S7VSBYZWDUIB4G3","short_pith_number":"pith:34C7JOXC","schema_version":"1.0","canonical_sha256":"df05f4bae21ab72fd641c66c3a203c36fcc768093cc1dd56115fe3094adba8d3","source":{"kind":"arxiv","id":"1111.1497","version":4},"attestation_state":"computed","paper":{"title":"An IR-based Evaluation Framework for Web Search Query Segmentation","license":"http://creativecommons.org/licenses/by/3.0/","headline":"","cross_cats":[],"primary_cat":"cs.IR","authors_text":"Monojit Choudhury, Niloy Ganguly, Rishiraj Saha Roy, Srivatsan Laxman","submitted_at":"2011-11-07T07:26:27Z","abstract_excerpt":"This paper presents the first evaluation framework for Web search query segmentation based directly on IR performance. In the past, segmentation strategies were mainly validated against manual annotations. Our work shows that the goodness of a segmentation algorithm as judged through evaluation against a handful of human annotated segmentations hardly reflects its effectiveness in an IR-based setup. In fact, state-of the-art algorithms are shown to perform as good as, and sometimes even better than human annotations -- a fact masked by previous validations. The proposed framework also provides"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1111.1497","kind":"arxiv","version":4},"metadata":{"license":"http://creativecommons.org/licenses/by/3.0/","primary_cat":"cs.IR","submitted_at":"2011-11-07T07:26:27Z","cross_cats_sorted":[],"title_canon_sha256":"de314bde3235338a107843010916d40839d322b540c0e29d459b35a14996af3e","abstract_canon_sha256":"00608e8459fd5a3f6de1f8cc0968df5d803fd1d9f5b078257eecff01b54d0168"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:21:34.867898Z","signature_b64":"joZ8kuHYl2ZPfF15RD/7BDnPeYyEu12DRo9sn0FTtUGUrT+pG0yZ3lAv0jUK8nX54PSZP24s6kzcMPLg1IwqCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"df05f4bae21ab72fd641c66c3a203c36fcc768093cc1dd56115fe3094adba8d3","last_reissued_at":"2026-05-18T02:21:34.867411Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:21:34.867411Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"An IR-based Evaluation Framework for Web Search Query Segmentation","license":"http://creativecommons.org/licenses/by/3.0/","headline":"","cross_cats":[],"primary_cat":"cs.IR","authors_text":"Monojit Choudhury, Niloy Ganguly, Rishiraj Saha Roy, Srivatsan Laxman","submitted_at":"2011-11-07T07:26:27Z","abstract_excerpt":"This paper presents the first evaluation framework for Web search query segmentation based directly on IR performance. In the past, segmentation strategies were mainly validated against manual annotations. Our work shows that the goodness of a segmentation algorithm as judged through evaluation against a handful of human annotated segmentations hardly reflects its effectiveness in an IR-based setup. In fact, state-of the-art algorithms are shown to perform as good as, and sometimes even better than human annotations -- a fact masked by previous validations. The proposed framework also provides"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1111.1497","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1111.1497","created_at":"2026-05-18T02:21:34.867480+00:00"},{"alias_kind":"arxiv_version","alias_value":"1111.1497v4","created_at":"2026-05-18T02:21:34.867480+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1111.1497","created_at":"2026-05-18T02:21:34.867480+00:00"},{"alias_kind":"pith_short_12","alias_value":"34C7JOXCDK3S","created_at":"2026-05-18T12:26:18.847500+00:00"},{"alias_kind":"pith_short_16","alias_value":"34C7JOXCDK3S7VSB","created_at":"2026-05-18T12:26:18.847500+00:00"},{"alias_kind":"pith_short_8","alias_value":"34C7JOXC","created_at":"2026-05-18T12:26:18.847500+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/34C7JOXCDK3S7VSBYZWDUIB4G3","json":"https://pith.science/pith/34C7JOXCDK3S7VSBYZWDUIB4G3.json","graph_json":"https://pith.science/api/pith-number/34C7JOXCDK3S7VSBYZWDUIB4G3/graph.json","events_json":"https://pith.science/api/pith-number/34C7JOXCDK3S7VSBYZWDUIB4G3/events.json","paper":"https://pith.science/paper/34C7JOXC"},"agent_actions":{"view_html":"https://pith.science/pith/34C7JOXCDK3S7VSBYZWDUIB4G3","download_json":"https://pith.science/pith/34C7JOXCDK3S7VSBYZWDUIB4G3.json","view_paper":"https://pith.science/paper/34C7JOXC","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1111.1497&json=true","fetch_graph":"https://pith.science/api/pith-number/34C7JOXCDK3S7VSBYZWDUIB4G3/graph.json","fetch_events":"https://pith.science/api/pith-number/34C7JOXCDK3S7VSBYZWDUIB4G3/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/34C7JOXCDK3S7VSBYZWDUIB4G3/action/timestamp_anchor","attest_storage":"https://pith.science/pith/34C7JOXCDK3S7VSBYZWDUIB4G3/action/storage_attestation","attest_author":"https://pith.science/pith/34C7JOXCDK3S7VSBYZWDUIB4G3/action/author_attestation","sign_citation":"https://pith.science/pith/34C7JOXCDK3S7VSBYZWDUIB4G3/action/citation_signature","submit_replication":"https://pith.science/pith/34C7JOXCDK3S7VSBYZWDUIB4G3/action/replication_record"}},"created_at":"2026-05-18T02:21:34.867480+00:00","updated_at":"2026-05-18T02:21:34.867480+00:00"}