{"id":"https://openalex.org/W2098249418","doi":"https://doi.org/10.1145/1460027.1460046","title":"Cross-lingual query classification","display_name":"Cross-lingual query classification","publication_year":2008,"publication_date":"2008-10-30","ids":{"openalex":"https://openalex.org/W2098249418","doi":"https://doi.org/10.1145/1460027.1460046","mag":"2098249418"},"language":"en","primary_location":{"id":"doi:10.1145/1460027.1460046","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1460027.1460046","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd ACM workshop on Improving non english web searching","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012483706","display_name":"Xuerui Wang","orcid":"https://orcid.org/0000-0001-8938-3420"},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xuerui Wang","raw_affiliation_strings":["University of Massachusetts, Amherst, MA, USA","University of Massachusetts, Amherst, MA, USA#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Massachusetts, Amherst, MA, USA","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"University of Massachusetts, Amherst, MA, USA#TAB#","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108541542","display_name":"Andrei Broder","orcid":null},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrei Broder","raw_affiliation_strings":["Yahoo! Research, Santa Clara, CA, USA","Yahoo! Research, Santa Clara , CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210134091"]},{"raw_affiliation_string":"Yahoo! Research, Santa Clara , CA, USA","institution_ids":["https://openalex.org/I4210134091"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013932834","display_name":"Evgeniy Gabrilovich","orcid":"https://orcid.org/0000-0001-7933-1926"},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Evgeniy Gabrilovich","raw_affiliation_strings":["Yahoo! Research, Santa Clara, CA, USA","Yahoo! Research, Santa Clara , CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210134091"]},{"raw_affiliation_string":"Yahoo! Research, Santa Clara , CA, USA","institution_ids":["https://openalex.org/I4210134091"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037908462","display_name":"Vanja Josifovski","orcid":null},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vanja Josifovski","raw_affiliation_strings":["Yahoo! Research, Santa Clara, CA, USA","Yahoo! Research, Santa Clara , CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210134091"]},{"raw_affiliation_string":"Yahoo! Research, Santa Clara , CA, USA","institution_ids":["https://openalex.org/I4210134091"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101799605","display_name":"Bo Pang","orcid":"https://orcid.org/0000-0003-4521-6369"},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bo Pang","raw_affiliation_strings":["Yahoo! Research, Santa Clara, CA, USA","Yahoo! Research, Santa Clara , CA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210134091"]},{"raw_affiliation_string":"Yahoo! Research, Santa Clara , CA, USA","institution_ids":["https://openalex.org/I4210134091"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7514,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.89526133,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"101","last_page":"104"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9872999787330627,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8608042001724243},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6324031949043274},{"id":"https://openalex.org/keywords/web-query-classification","display_name":"Web query classification","score":0.5690906643867493},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.5639755725860596},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5474858283996582},{"id":"https://openalex.org/keywords/taxonomy","display_name":"Taxonomy (biology)","score":0.5374671816825867},{"id":"https://openalex.org/keywords/web-search-query","display_name":"Web search query","score":0.5286588668823242},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49712398648262024},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.46932193636894226},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.46800413727760315},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.45217329263687134},{"id":"https://openalex.org/keywords/query-expansion","display_name":"Query expansion","score":0.4408096373081207},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4126896560192108},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.3526257872581482},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3504086136817932}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8608042001724243},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6324031949043274},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.5690906643867493},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.5639755725860596},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5474858283996582},{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.5374671816825867},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.5286588668823242},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49712398648262024},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.46932193636894226},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.46800413727760315},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.45217329263687134},{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.4408096373081207},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4126896560192108},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.3526257872581482},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3504086136817932},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1460027.1460046","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1460027.1460046","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd ACM workshop on Improving non english web searching","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W1489959797","https://openalex.org/W1972640883","https://openalex.org/W1994966918","https://openalex.org/W2064885744","https://openalex.org/W2098876286","https://openalex.org/W2099031744","https://openalex.org/W2123198781","https://openalex.org/W2145631291","https://openalex.org/W2150749667"],"related_works":["https://openalex.org/W2096359267","https://openalex.org/W2901901036","https://openalex.org/W2026738364","https://openalex.org/W1521725692","https://openalex.org/W2093300859","https://openalex.org/W3008917487","https://openalex.org/W2124814993","https://openalex.org/W2013069866","https://openalex.org/W3197639690","https://openalex.org/W2572349046"],"abstract_inverted_index":{"The":[0],"non-English":[1,55,140],"Web":[2,130],"is":[3,57,61,94,104],"growing":[4],"at":[5],"breakneck":[6],"speed,":[7],"but":[8],"available":[9,43],"language":[10,169],"processing":[11,79],"tools":[12],"are":[13,18,25,40],"mostly":[14],"English":[15,34,67,144],"based.":[16],"Taxonomies":[17],"a":[19,101,135],"case":[20],"in":[21,53,81,87,165],"point:":[22],"while":[23],"there":[24],"plenty":[26],"of":[27,45,122,128,173,180],"commercial":[28,129],"and":[29,112,118,146],"non-commercial":[30],"taxonomies":[31,36,52,68],"for":[32,37,107,119,138,189],"the":[33,92,109,125,162,166,178],"Web,":[35],"other":[38,82],"languages":[39,56],"either":[41],"not":[42],"or":[44,183],"very":[46],"limited":[47],"quality.":[48],"Given":[49],"that":[50,91,159,193],"building":[51],"all":[54],"prohibitively":[58],"expensive,":[59],"it":[60],"natural":[62],"to":[63,76,98],"ask":[64],"whether":[65],"existing":[66],"can":[69,176],"be":[70],"leveraged,":[71],"possibly":[72],"via":[73],"machine":[74,152,185],"translation,":[75],"enable":[77],"information":[78],"tasks":[80],"languages.":[83],"Preliminary":[84],"results":[85,164,188],"presented":[86],"this":[88],"paper":[89],"indicate":[90],"answer":[93],"affirmative":[95],"with":[96],"respect":[97],"query":[99],"classification,":[100],"task":[102],"which":[103],"essential":[105],"both":[106],"understanding":[108],"user":[110],"intent":[111],"thus":[113],"provide":[114],"better":[115,120],"search":[116,131,163],"results,":[117],"targeting":[121],"search-based":[123],"advertising,":[124],"economic":[126],"underpinning":[127],"engines.":[132],"We":[133],"propose":[134],"robust":[136],"method":[137],"classifying":[139],"queries":[141,191],"against":[142],"an":[143],"taxonomy":[145],"classifier":[147],"using":[148],"widely":[149],"available,":[150],"off-the-shelf":[151],"translation":[153],"systems.":[154],"In":[155],"particular,":[156],"we":[157,175,194],"show":[158,192],"by":[160],"viewing":[161],"query's":[167],"original":[168],"as":[170],"independent":[171],"sources":[172],"information,":[174],"alleviate":[177],"impact":[179],"poor":[181],"quality":[182],"erroneous":[184],"translations.":[186],"Empirical":[187],"Chinese":[190],"achieve":[195],"remarkably":[196],"encouraging":[197],"results.":[198]},"counts_by_year":[{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
