{"id":"https://openalex.org/W2159676500","doi":"https://doi.org/10.1145/2382616.2382621","title":"Exploiting External Collections for Query Expansion","display_name":"Exploiting External Collections for Query Expansion","publication_year":2012,"publication_date":"2012-11-01","ids":{"openalex":"https://openalex.org/W2159676500","doi":"https://doi.org/10.1145/2382616.2382621","mag":"2159676500"},"language":"en","primary_location":{"id":"doi:10.1145/2382616.2382621","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2382616.2382621","pdf_url":null,"source":{"id":"https://openalex.org/S131231701","display_name":"ACM Transactions on the Web","issn_l":"1559-1131","issn":["1559-1131","1559-114X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on the Web","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071682310","display_name":"Wouter Weerkamp","orcid":null},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Wouter Weerkamp","raw_affiliation_strings":["University of Amsterdam"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam","institution_ids":["https://openalex.org/I887064364"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059926999","display_name":"Krisztian Balog","orcid":"https://orcid.org/0000-0003-2762-721X"},"institutions":[{"id":"https://openalex.org/I4210165875","display_name":"NTNU Samfunnsforskning","ror":"https://ror.org/05pv30e80","country_code":"NO","type":"facility","lineage":["https://openalex.org/I4210165875"]}],"countries":["NO"],"is_corresponding":false,"raw_author_name":"Krisztian Balog","raw_affiliation_strings":["NTNU Trondheim"],"affiliations":[{"raw_affiliation_string":"NTNU Trondheim","institution_ids":["https://openalex.org/I4210165875"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031439294","display_name":"Maarten de Rijke","orcid":"https://orcid.org/0000-0002-1086-0202"},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Maarten de Rijke","raw_affiliation_strings":["University of Amsterdam"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam","institution_ids":["https://openalex.org/I887064364"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5071682310"],"corresponding_institution_ids":["https://openalex.org/I887064364"],"apc_list":null,"apc_paid":null,"fwci":3.9779,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.93908077,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"6","issue":"4","first_page":"1","last_page":"29"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8412680625915527},{"id":"https://openalex.org/keywords/query-expansion","display_name":"Query expansion","score":0.8309465050697327},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.7359492182731628},{"id":"https://openalex.org/keywords/encyclopedia","display_name":"Encyclopedia","score":0.5616358518600464},{"id":"https://openalex.org/keywords/query-language","display_name":"Query language","score":0.5461760759353638},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.5371677875518799},{"id":"https://openalex.org/keywords/web-search-query","display_name":"Web search query","score":0.5321962833404541},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.5189899802207947},{"id":"https://openalex.org/keywords/web-query-classification","display_name":"Web query classification","score":0.5040480494499207},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.48862773180007935},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.45644575357437134},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4396204948425293},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.24552232027053833},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.1713353395462036}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8412680625915527},{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.8309465050697327},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.7359492182731628},{"id":"https://openalex.org/C148863701","wikidata":"https://www.wikidata.org/wiki/Q5292","display_name":"Encyclopedia","level":2,"score":0.5616358518600464},{"id":"https://openalex.org/C192028432","wikidata":"https://www.wikidata.org/wiki/Q845739","display_name":"Query language","level":2,"score":0.5461760759353638},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.5371677875518799},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.5321962833404541},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.5189899802207947},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.5040480494499207},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.48862773180007935},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.45644575357437134},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4396204948425293},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.24552232027053833},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.1713353395462036},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C161191863","wikidata":"https://www.wikidata.org/wiki/Q199655","display_name":"Library science","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1145/2382616.2382621","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2382616.2382621","pdf_url":null,"source":{"id":"https://openalex.org/S131231701","display_name":"ACM Transactions on the Web","issn_l":"1559-1131","issn":["1559-1131","1559-114X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on the Web","raw_type":"journal-article"},{"id":"pmh:oai:dare.uva.nl:openaire_cris_publications/72964552-b11f-44ba-9951-2579584e6e6e","is_oa":false,"landing_page_url":"https://dare.uva.nl/personal/pure/en/publications/exploiting-external-collections-for-query-expansion(72964552-b11f-44ba-9951-2579584e6e6e).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Weerkamp, W, Balog, K & de Rijke, M 2012, 'Exploiting External Collections for Query Expansion', ACM Transactions on the Web, vol. 6, no. 4, pp. 18. https://doi.org/10.1145/2382616.2382621","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.423.2931","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.423.2931","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://krisztianbalog.com/files/tweb2012-external.pdf","raw_type":"text"},{"id":"pmh:oai:dare.uva.nl:publications/72964552-b11f-44ba-9951-2579584e6e6e","is_oa":false,"landing_page_url":"https://handle.uba.uva.nl/personal/pure/en/publications/exploiting-external-collections-for-query-expansion(72964552-b11f-44ba-9951-2579584e6e6e).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Weerkamp, W, Balog, K & de Rijke, M 2012, 'Exploiting External Collections for Query Expansion', ACM Transactions on the Web, vol. 6, no. 4, pp. 18. https://doi.org/10.1145/2382616.2382621","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.699999988079071,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G5969595699","display_name":null,"funder_award_id":"nr 258191 (PROMISE)","funder_id":"https://openalex.org/F4320334960","funder_display_name":"Seventh Framework Programme"},{"id":"https://openalex.org/G701973873","display_name":null,"funder_award_id":"nrs 612.061.814623.061.815640.004.802380-70-011727.011.005612.001.116","funder_id":"https://openalex.org/F4320321800","funder_display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek"}],"funders":[{"id":"https://openalex.org/F4320321800","display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek","ror":"https://ror.org/04jsz6e67"},{"id":"https://openalex.org/F4320334960","display_name":"Seventh Framework Programme","ror":"https://ror.org/00k4n6c32"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W26119036","https://openalex.org/W143775383","https://openalex.org/W160659377","https://openalex.org/W223477476","https://openalex.org/W343173671","https://openalex.org/W1483313504","https://openalex.org/W1484772416","https://openalex.org/W1503333931","https://openalex.org/W1532325895","https://openalex.org/W1536077504","https://openalex.org/W1557207628","https://openalex.org/W1563804946","https://openalex.org/W1572945832","https://openalex.org/W1592871157","https://openalex.org/W1596258944","https://openalex.org/W1601407209","https://openalex.org/W1605510967","https://openalex.org/W1660390307","https://openalex.org/W1711590747","https://openalex.org/W1828972360","https://openalex.org/W1898200041","https://openalex.org/W1951029750","https://openalex.org/W1969949308","https://openalex.org/W1987996059","https://openalex.org/W1994401877","https://openalex.org/W2019973434","https://openalex.org/W2050095925","https://openalex.org/W2052088591","https://openalex.org/W2057844097","https://openalex.org/W2066698827","https://openalex.org/W2070740689","https://openalex.org/W2083808574","https://openalex.org/W2093390569","https://openalex.org/W2095368471","https://openalex.org/W2098647075","https://openalex.org/W2099871636","https://openalex.org/W2101196063","https://openalex.org/W2102563107","https://openalex.org/W2104049510","https://openalex.org/W2108743173","https://openalex.org/W2114512077","https://openalex.org/W2124906298","https://openalex.org/W2127452535","https://openalex.org/W2127492100","https://openalex.org/W2131133093","https://openalex.org/W2150409425","https://openalex.org/W2153870588","https://openalex.org/W2155030693","https://openalex.org/W2155467656","https://openalex.org/W2161722485","https://openalex.org/W2164547069","https://openalex.org/W2166282252","https://openalex.org/W2169213601","https://openalex.org/W2768581363","https://openalex.org/W2915595141","https://openalex.org/W4206765718","https://openalex.org/W4213009331","https://openalex.org/W4246858749"],"related_works":["https://openalex.org/W2572349046","https://openalex.org/W2096359267","https://openalex.org/W2026738364","https://openalex.org/W4256058599","https://openalex.org/W3197639690","https://openalex.org/W2124814993","https://openalex.org/W2017989738","https://openalex.org/W1981131819","https://openalex.org/W8514837","https://openalex.org/W2186703450"],"abstract_inverted_index":{"A":[0],"persisting":[1],"challenge":[2],"in":[3,195],"the":[4,10,19,37,42,102,172,180,183,222,228,245,269,279,290],"field":[5],"of":[6,24,123,171,185,230,244,272],"information":[7,16],"retrieval":[8,188,287],"is":[9,28,113],"vocabulary":[11],"mismatch":[12],"between":[13],"a":[14,88,144,163,199,203,210,295],"user\u2019s":[15],"need":[17],"and":[18,40,52,57,78,128,189,208,239,260],"relevant":[20],"documents.":[21],"One":[22],"way":[23],"addressing":[25],"this":[26,84],"issue":[27],"to":[29,33,36,68,80,147,179,252],"apply":[30],"query":[31,39,60,73,91,118,219],"modeling:":[32],"add":[34],"terms":[35,161],"original":[38],"reweigh":[41],"terms.":[43],"In":[44,83],"social":[45],"media,":[46],"where":[47],"documents":[48],"usually":[49],"contain":[50],"creative":[51],"noisy":[53],"language":[54],"(e.g.,":[55],"spelling":[56],"grammatical":[58],"errors),":[59],"modeling":[61,74],"proves":[62],"difficult.":[63],"To":[64],"address":[65],"this,":[66],"attempts":[67],"use":[69,191,264],"external":[70,96,124,173,193],"sources":[71],"for":[72,99,126,135,142,152,168],"have":[75],"been":[76],"made":[77],"seem":[79],"be":[81,148],"successful.":[82],"article":[85],"we":[86,140,155,190,263,267],"propose":[87],"general":[89,164],"generative":[90],"expansion":[92,127,131,220],"model":[93,112,132,178],"that":[94,116,129,216,233,248,278],"uses":[95],"document":[97],"collections":[98,125,194],"term":[100],"generation:":[101],"External":[103],"Expansion":[104],"Model":[105],"(EEM).":[106],"The":[107],"main":[108],"rationale":[109],"behind":[110],"our":[111,114,177,196,249,273],"hypothesis":[115],"each":[117],"requires":[119],"its":[120],"own":[121],"mixture":[122],"an":[130],"should":[133],"account":[134],"this.":[136],"For":[137],"some":[138],"queries":[139,154],"expect,":[141],"example,":[143],"news":[145,200],"collection":[146,255,281,292,296],"most":[149],"beneficial,":[150],"while":[151],"other":[153],"could":[156],"benefit":[157],"more":[158,284],"by":[159,237],"selecting":[160],"from":[162],"encyclopedia.":[165],"EEM":[166,217],"allows":[167],"query-dependent":[169,254,280],"weighing":[170],"collections.":[174],"We":[175,275],"put":[176],"test":[181],"on":[182,221,286],"task":[184],"blog":[186,211],"post":[187,212],"four":[192],"experiments:":[197],"(i)":[198],"collection,":[201,205],"(ii)":[202],"Web":[204],"(iii)":[206],"Wikipedia,":[207],"(iv)":[209],"collection.":[213],"Experiments":[214],"show":[215],"outperforms":[218],"individual":[223],"collections,":[224],"as":[225,227],"well":[226,259],"Mixture":[229],"Relevance":[231],"Models":[232],"was":[234],"previously":[235],"proposed":[236],"Diaz":[238],"Metzler":[240],"[2006].":[241],"Extensive":[242],"analysis":[243],"results":[246],"shows":[247],"naive":[250],"approach":[251],"estimating":[253],"importance":[256,282,293],"works":[257],"reasonably":[258],"that,":[261],"when":[262],"\u201coracle\u201d":[265],"settings,":[266],"see":[268],"full":[270],"potential":[271],"model.":[274],"also":[276],"find":[277],"has":[283],"impact":[285],"performance":[288],"than":[289],"independent":[291],"(i.e.,":[294],"prior).":[297]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
