{"id":"https://openalex.org/W2082130842","doi":"https://doi.org/10.1145/1183614.1183711","title":"Coupling feature selection and machine learning methods for navigational query identification","display_name":"Coupling feature selection and machine learning methods for navigational query identification","publication_year":2006,"publication_date":"2006-01-01","ids":{"openalex":"https://openalex.org/W2082130842","doi":"https://doi.org/10.1145/1183614.1183711","mag":"2082130842"},"language":"en","primary_location":{"id":"doi:10.1145/1183614.1183711","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1183614.1183711","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 15th ACM international conference on Information and knowledge management  - CIKM '06","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5104036890","display_name":"Yumao Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yumao Lu","raw_affiliation_strings":["Yahoo! Inc., Sunnyvale, California","Yahoo! Inc., Sunnyvale, California#TAB#"],"affiliations":[{"raw_affiliation_string":"Yahoo! Inc., Sunnyvale, California","institution_ids":["https://openalex.org/I4210134091"]},{"raw_affiliation_string":"Yahoo! Inc., Sunnyvale, California#TAB#","institution_ids":["https://openalex.org/I4210134091"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047400593","display_name":"Fuchun Peng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fuchun Peng","raw_affiliation_strings":["Yahoo! Inc., Sunnyvale, California","Yahoo! Inc., Sunnyvale, California#TAB#"],"affiliations":[{"raw_affiliation_string":"Yahoo! Inc., Sunnyvale, California","institution_ids":["https://openalex.org/I4210134091"]},{"raw_affiliation_string":"Yahoo! Inc., Sunnyvale, California#TAB#","institution_ids":["https://openalex.org/I4210134091"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100353780","display_name":"Xin Li","orcid":"https://orcid.org/0000-0002-0041-3134"},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xin Li","raw_affiliation_strings":["Yahoo! Inc., Sunnyvale, California","Yahoo! Inc., Sunnyvale, California#TAB#"],"affiliations":[{"raw_affiliation_string":"Yahoo! Inc., Sunnyvale, California","institution_ids":["https://openalex.org/I4210134091"]},{"raw_affiliation_string":"Yahoo! Inc., Sunnyvale, California#TAB#","institution_ids":["https://openalex.org/I4210134091"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016105683","display_name":"Nawaaz Ahmed","orcid":null},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nawaaz Ahmed","raw_affiliation_strings":["Yahoo! Inc., Sunnyvale, California","Yahoo! Inc., Sunnyvale, California#TAB#"],"affiliations":[{"raw_affiliation_string":"Yahoo! Inc., Sunnyvale, California","institution_ids":["https://openalex.org/I4210134091"]},{"raw_affiliation_string":"Yahoo! Inc., Sunnyvale, California#TAB#","institution_ids":["https://openalex.org/I4210134091"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5104036890"],"corresponding_institution_ids":["https://openalex.org/I4210134091"],"apc_list":null,"apc_paid":null,"fwci":2.5819,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.9148821,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"682","last_page":"682"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8195520639419556},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.7116213440895081},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6769455075263977},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6348541975021362},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.5737502574920654},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.528972327709198},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.5105608701705933},{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.49160465598106384},{"id":"https://openalex.org/keywords/decision-tree","display_name":"Decision tree","score":0.4579888582229614},{"id":"https://openalex.org/keywords/information-gain-ratio","display_name":"Information gain ratio","score":0.4507963955402374},{"id":"https://openalex.org/keywords/gradient-boosting","display_name":"Gradient boosting","score":0.4415450692176819},{"id":"https://openalex.org/keywords/web-query-classification","display_name":"Web query classification","score":0.42355674505233765},{"id":"https://openalex.org/keywords/web-search-query","display_name":"Web search query","score":0.41988909244537354},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.38521113991737366},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.3399333357810974},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.25580888986587524}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8195520639419556},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.7116213440895081},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6769455075263977},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6348541975021362},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.5737502574920654},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.528972327709198},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.5105608701705933},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.49160465598106384},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.4579888582229614},{"id":"https://openalex.org/C202185110","wikidata":"https://www.wikidata.org/wiki/Q6031086","display_name":"Information gain ratio","level":3,"score":0.4507963955402374},{"id":"https://openalex.org/C70153297","wikidata":"https://www.wikidata.org/wiki/Q5591907","display_name":"Gradient boosting","level":3,"score":0.4415450692176819},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.42355674505233765},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.41988909244537354},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.38521113991737366},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.3399333357810974},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.25580888986587524}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1183614.1183711","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1183614.1183711","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 15th ACM international conference on Information and knowledge management  - CIKM '06","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.94.4213","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.94.4213","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.ee.ucla.edu/~luym/LuPengLiAhmed06CIKM.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1554944419","https://openalex.org/W1965073581","https://openalex.org/W1985182453","https://openalex.org/W1998548536","https://openalex.org/W2010463775","https://openalex.org/W2024869911","https://openalex.org/W2070493638","https://openalex.org/W2102667697","https://openalex.org/W2104217798","https://openalex.org/W2124658502","https://openalex.org/W2149684865","https://openalex.org/W2155540986","https://openalex.org/W2156037541","https://openalex.org/W2156909104","https://openalex.org/W2160842254","https://openalex.org/W2168239404","https://openalex.org/W2435251607","https://openalex.org/W2799061466","https://openalex.org/W2911427979","https://openalex.org/W3049188988"],"related_works":["https://openalex.org/W2026738364","https://openalex.org/W2096359267","https://openalex.org/W2901901036","https://openalex.org/W2124814993","https://openalex.org/W2113390685","https://openalex.org/W3114052401","https://openalex.org/W2330073594","https://openalex.org/W2163573236","https://openalex.org/W2093300859","https://openalex.org/W2013069866"],"abstract_inverted_index":{"It":[0],"is":[1,140,202,225],"important":[2,163],"yet":[3],"hard":[4],"to":[5,13,82,174,182,231,242],"identify":[6],"navigational":[7,54,108,169,214],"queries":[8,109,215],"in":[9,19,57,99],"Web":[10,20,58,122],"search":[11,119,123,145],"due":[12],"a":[14,94,243],"lack":[15],"of":[16,64,97,106,112,165],"sufficient":[17],"information":[18],"queries,":[21],"which":[22,224],"are":[23,160],"typically":[24],"very":[25],"short.":[26],"In":[27,172],"this":[28,100],"paper":[29],"we":[30,68,102,154],"study":[31,103],"several":[32,70],"machine":[33,45,66,178],"learning":[34,179],"methods,":[35],"including":[36],"naive":[37],"Bayes":[38],"model,":[39,42],"maximum":[40],"entropy":[41],"support":[43],"vector":[44],"(SVM),":[46],"and":[47,74,129,211,236],"stochastic":[48],"gradient":[49,193],"boosting":[50,194],"tree":[51],"(SGBT),":[52],"for":[53,167],"query":[55,127],"identification":[56],"search.":[59],"To":[60],"boost":[61],"the":[62,84,104,130,152,161,232],"performance":[63],"these":[65],"techniques,":[67],"exploit":[69],"feature":[71,77,137,187,200,209,248],"selection":[72,78,188,201,210],"methods":[73],"propose":[75],"coupling":[76],"with":[79,110,185,197,220],"classification":[80,212],"approaches":[81,180],"achieve":[83,175],"best":[85,233],"performance.":[86],"Different":[87],"from":[88,116],"most":[89,162,203],"prior":[90],"work":[91],"that":[92,148,192],"uses":[93],"small":[95],"number":[96],"features,":[98,114],"paper,":[101],"problem":[105],"identifying":[107,168],"thousands":[111],"available":[113],"extracted":[115],"major":[117],"commercial":[118],"engine":[120],"results,":[121],"user":[124,156],"click":[125,157],"data,":[126],"log,":[128],"whole":[131],"Web's":[132],"relational":[133],"content.":[134],"A":[135],"multi-level":[136],"extraction":[138],"system":[139,246],"constructed.Our":[141],"results":[142],"on":[143],"real":[144],"data":[146],"show":[147],"1)":[149],"Among":[150],"all":[151],"features":[153,159,166],"tested,":[155],"distribution":[158],"set":[164],"queries.":[170],"2)":[171],"order":[173],"good":[176,186],"performance,":[177],"have":[181],"be":[183,217],"coupled":[184,196,208],"methods.":[189],"We":[190],"find":[191],"tree,":[195],"linear":[198],"SVM":[199],"effective.":[204],"3)":[205],"With":[206],"carefully":[207],"approaches,":[213],"can":[216],"accurately":[218],"identified":[219],"88.1%":[221],"F1":[222],"score,":[223],"33%":[226],"error":[227,238],"rate":[228,239],"reduction":[229,240],"compared":[230,241],"uncoupled":[234],"system,":[235],"40%":[237],"well":[244],"tuned":[245],"without":[247],"selection.":[249]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":3},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":3}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
