{"id":"https://openalex.org/W2150155583","doi":"https://doi.org/10.1145/2600428.2609622","title":"Query expansion for mixed-script information retrieval","display_name":"Query expansion for mixed-script information retrieval","publication_year":2014,"publication_date":"2014-07-03","ids":{"openalex":"https://openalex.org/W2150155583","doi":"https://doi.org/10.1145/2600428.2609622","mag":"2150155583"},"language":"en","primary_location":{"id":"doi:10.1145/2600428.2609622","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2600428.2609622","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 37th international ACM SIGIR conference on Research &amp; development in information retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102919542","display_name":"Parth Gupta","orcid":"https://orcid.org/0000-0003-0232-3412"},"institutions":[{"id":"https://openalex.org/I60053951","display_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","ror":"https://ror.org/01460j859","country_code":"ES","type":"education","lineage":["https://openalex.org/I60053951"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Parth Gupta","raw_affiliation_strings":["Universitat Polit\u00e8cnica de Val\u00e8ncia, Valencia, Spain"],"affiliations":[{"raw_affiliation_string":"Universitat Polit\u00e8cnica de Val\u00e8ncia, Valencia, Spain","institution_ids":["https://openalex.org/I60053951"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013639574","display_name":"Kalika Bali","orcid":"https://orcid.org/0000-0001-9275-742X"},"institutions":[{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Kalika Bali","raw_affiliation_strings":["Microsoft Research Labs India, Bangalore, India"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Labs India, Bangalore, India","institution_ids":["https://openalex.org/I4210124949"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022050902","display_name":"Rafael E. Banchs","orcid":null},"institutions":[{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Rafael E. Banchs","raw_affiliation_strings":["Institute for Infocomm Research, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research, Singapore, Singapore","institution_ids":["https://openalex.org/I3005327000"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008944385","display_name":"Monojit Choudhury","orcid":"https://orcid.org/0000-0001-7473-7839"},"institutions":[{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Monojit Choudhury","raw_affiliation_strings":["Microsoft Research Labs India, Bangalore, India"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Labs India, Bangalore, India","institution_ids":["https://openalex.org/I4210124949"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053947754","display_name":"Paolo Rosso","orcid":"https://orcid.org/0000-0002-8922-1242"},"institutions":[{"id":"https://openalex.org/I60053951","display_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","ror":"https://ror.org/01460j859","country_code":"ES","type":"education","lineage":["https://openalex.org/I60053951"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Paolo Rosso","raw_affiliation_strings":["Universitat Polit\u00e8cnica de Val\u00e8ncia, Valencia, Spain"],"affiliations":[{"raw_affiliation_string":"Universitat Polit\u00e8cnica de Val\u00e8ncia, Valencia, Spain","institution_ids":["https://openalex.org/I60053951"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5102919542"],"corresponding_institution_ids":["https://openalex.org/I60053951"],"apc_list":null,"apc_paid":null,"fwci":20.4506,"has_fulltext":false,"cited_by_count":99,"citation_normalized_percentile":{"value":0.99439309,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"677","last_page":"686"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scripting-language","display_name":"Scripting language","score":0.8343989849090576},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8325122594833374},{"id":"https://openalex.org/keywords/spelling","display_name":"Spelling","score":0.6389446258544922},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.5640323162078857},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.5532228946685791},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5458763241767883},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5371594429016113},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5049200654029846},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4683358669281006},{"id":"https://openalex.org/keywords/dropout","display_name":"Dropout (neural networks)","score":0.41741690039634705},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1551753282546997},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.1429792046546936},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.07554447650909424}],"concepts":[{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.8343989849090576},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8325122594833374},{"id":"https://openalex.org/C2777801307","wikidata":"https://www.wikidata.org/wiki/Q2088390","display_name":"Spelling","level":2,"score":0.6389446258544922},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.5640323162078857},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.5532228946685791},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5458763241767883},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5371594429016113},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5049200654029846},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4683358669281006},{"id":"https://openalex.org/C2776145597","wikidata":"https://www.wikidata.org/wiki/Q25339462","display_name":"Dropout (neural networks)","level":2,"score":0.41741690039634705},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1551753282546997},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1429792046546936},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.07554447650909424},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C44870925","wikidata":"https://www.wikidata.org/wiki/Q37547","display_name":"Astrophysics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2600428.2609622","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2600428.2609622","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 37th international ACM SIGIR conference on Research &amp; development in information retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8100000023841858,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320308943","display_name":"Microsoft Research","ror":"https://ror.org/00d0nc645"},{"id":"https://openalex.org/F4320325536","display_name":"Indian Institute of Technology Kharagpur","ror":"https://ror.org/03w5sq511"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W93881433","https://openalex.org/W199018803","https://openalex.org/W1514154358","https://openalex.org/W1551409364","https://openalex.org/W1575181818","https://openalex.org/W1654045153","https://openalex.org/W1777547826","https://openalex.org/W1916169864","https://openalex.org/W1997538087","https://openalex.org/W1997599838","https://openalex.org/W2010392031","https://openalex.org/W2044030465","https://openalex.org/W2047622036","https://openalex.org/W2050050080","https://openalex.org/W2057786281","https://openalex.org/W2068130800","https://openalex.org/W2079251416","https://openalex.org/W2079968649","https://openalex.org/W2095277595","https://openalex.org/W2098249418","https://openalex.org/W2100002341","https://openalex.org/W2100495367","https://openalex.org/W2111215091","https://openalex.org/W2112280478","https://openalex.org/W2116064496","https://openalex.org/W2123660869","https://openalex.org/W2129264959","https://openalex.org/W2147152072","https://openalex.org/W2149945051","https://openalex.org/W2158246688","https://openalex.org/W2251969930","https://openalex.org/W2913739034","https://openalex.org/W2913932916"],"related_works":["https://openalex.org/W2161008081","https://openalex.org/W4298186509","https://openalex.org/W2556702969","https://openalex.org/W217221262","https://openalex.org/W611030372","https://openalex.org/W1974418053","https://openalex.org/W2021532426","https://openalex.org/W2530486443","https://openalex.org/W2081317458","https://openalex.org/W2228086542"],"abstract_inverted_index":{"For":[0],"many":[1],"languages":[2],"that":[3],"use":[4],"non-Roman":[5],"based":[6],"indigenous":[7],"scripts":[8,145],"(e.g.,":[9],"Arabic,":[10],"Greek":[11],"and":[12,103,117,137,153,197],"Indic":[13],"languages)":[14],"one":[15,45],"can":[16,154],"often":[17],"find":[18],"a":[19,37,128,150,158],"large":[20],"amount":[21],"of":[22,100,106,110,122,168,182],"user":[23],"generated":[24],"transliterated":[25,86],"content":[26,35,87],"on":[27],"the":[28,31,52,57,67,70,78,83,98,107,115,120,133,141,144,169,174,186],"Web":[29],"in":[30,56,65,81,149,157,177,195,200],"Roman":[32,71],"script.":[33],"Such":[34],"creates":[36],"monolingual":[38],"or":[39,69],"multi-lingual":[40],"space":[41,59],"with":[42,173],"more":[43],"than":[44],"script":[46,72],"which":[47],"we":[48,95],"refer":[49],"to":[50,74,77,131,203],"as":[51],"Mixed-Script":[53,101],"space.":[54,161],"IR":[55,184],"mixed-script":[58,134,183],"is":[60],"challenging":[61],"because":[62],"queries":[63],"written":[64,80],"either":[66],"native":[68],"need":[73],"be":[75,155],"matched":[76],"documents":[79],"both":[82],"scripts.":[84],"Moreover,":[85],"features":[88],"extensive":[89,165],"spelling":[90,138],"variations.":[91],"In":[92],"this":[93,123],"paper,":[94],"formally":[96],"introduce":[97],"concept":[99],"IR,":[102],"through":[104],"analysis":[105,167],"query":[108],"logs":[109],"Bing":[111],"search":[112],"engine,":[113],"estimate":[114],"prevalence":[116],"thereby":[118],"establish":[119],"importance":[121],"problem.":[124],"We":[125,162],"also":[126],"give":[127],"principled":[129],"solution":[130],"handle":[132],"term":[135],"matching":[136],"variation":[139],"where":[140,185],"terms":[142],"across":[143],"are":[146],"modelled":[147],"jointly":[148],"deep-learning":[151],"architecture":[152],"compared":[156,202],"low-dimensional":[159],"abstract":[160],"present":[163],"an":[164,178],"empirical":[166],"proposed":[170,187],"method":[171,188],"along":[172],"evaluation":[175],"results":[176,192],"ad-hoc":[179],"retrieval":[180],"setting":[181],"achieves":[189],"significantly":[190],"better":[191],"(12%":[193],"increase":[194,199],"MRR":[196],"29%":[198],"MAP)":[201],"other":[204],"state-of-the-art":[205],"baselines.":[206]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":9},{"year":2018,"cited_by_count":12},{"year":2017,"cited_by_count":10},{"year":2016,"cited_by_count":22},{"year":2015,"cited_by_count":14},{"year":2014,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
