{"id":"https://openalex.org/W7106676899","doi":"https://doi.org/10.48550/arxiv.2511.19325","title":"Generative Query Expansion with Multilingual LLMs for Cross-Lingual Information Retrieval","display_name":"Generative Query Expansion with Multilingual LLMs for Cross-Lingual Information Retrieval","publication_year":2025,"publication_date":"2025-11-24","ids":{"openalex":"https://openalex.org/W7106676899","doi":"https://doi.org/10.48550/arxiv.2511.19325"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2511.19325","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.19325","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2511.19325","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Macmillan-Scott, Olivia","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Macmillan-Scott, Olivia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Goworek, Roksana","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goworek, Roksana","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"\u00d6zyi\u011fit, Eda B.","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"\u00d6zyi\u011fit, Eda B.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9901000261306763,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9901000261306763,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.0008999999845400453,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.0005000000237487257,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/query-expansion","display_name":"Query expansion","score":0.8173999786376953},{"id":"https://openalex.org/keywords/query-language","display_name":"Query language","score":0.5989999771118164},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.51910001039505},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.48249998688697815},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.42910000681877136},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.4284999966621399},{"id":"https://openalex.org/keywords/multilingualism","display_name":"Multilingualism","score":0.4072999954223633},{"id":"https://openalex.org/keywords/rdf-query-language","display_name":"RDF query language","score":0.40130001306533813}],"concepts":[{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.8173999786376953},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7662000060081482},{"id":"https://openalex.org/C192028432","wikidata":"https://www.wikidata.org/wiki/Q845739","display_name":"Query language","level":2,"score":0.5989999771118164},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5550000071525574},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.51910001039505},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.48249998688697815},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.42910000681877136},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.4284999966621399},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4156999886035919},{"id":"https://openalex.org/C2780035574","wikidata":"https://www.wikidata.org/wiki/Q30081","display_name":"Multilingualism","level":2,"score":0.4072999954223633},{"id":"https://openalex.org/C96956885","wikidata":"https://www.wikidata.org/wiki/Q6138701","display_name":"RDF query language","level":5,"score":0.40130001306533813},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3921999931335449},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.3700999915599823},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3472999930381775},{"id":"https://openalex.org/C59656382","wikidata":"https://www.wikidata.org/wiki/Q191536","display_name":"Conjunction (astronomy)","level":2,"score":0.3230000138282776},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.30070000886917114},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.3005000054836273},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.28769999742507935},{"id":"https://openalex.org/C2778842860","wikidata":"https://www.wikidata.org/wiki/Q986551","display_name":"Cross-language information retrieval","level":3,"score":0.2809000015258789},{"id":"https://openalex.org/C41009113","wikidata":"https://www.wikidata.org/wiki/Q54871","display_name":"SPARQL","level":4,"score":0.2689000070095062},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2635999917984009}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2511.19325","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.19325","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2511.19325","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.19325","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Query":[0],"expansion":[1,43,89,128],"is":[2,15,72,109,142,152],"the":[3,63,131,137,161,173],"reformulation":[4],"of":[5,19,167],"a":[6],"user":[7],"query":[8,42,102,127],"by":[9],"adding":[10],"semantically":[11],"related":[12,50],"information,":[13],"and":[14,21,49,61,68,83,111,163,179,182],"an":[16],"essential":[17],"component":[18],"monolingual":[20],"cross-lingual":[22,96,126,180],"information":[23],"retrieval":[24,97,141],"used":[25],"to":[26,52,91,154,156],"ensure":[27],"that":[28,94,101,112],"relevant":[29,59],"documents":[30],"are":[31,166],"not":[32,118],"missed.":[33],"Recently,":[34],"multilingual":[35,178],"large":[36],"language":[37],"models":[38],"(mLLMs)":[39],"have":[40],"shifted":[41],"from":[44],"semantic":[45],"augmentation":[46],"with":[47,136],"synonyms":[48],"words":[51],"pseudo-document":[53],"generation.":[54],"Pseudo-documents":[55],"both":[56],"introduce":[57],"additional":[58],"terms":[60],"bridge":[62],"gap":[64],"between":[65,145],"short":[66],"queries":[67],"long":[69],"documents,":[70],"which":[71,106],"particularly":[73],"beneficial":[74],"in":[75,148],"dense":[76],"retrieval.":[77],"This":[78],"study":[79],"evaluates":[80],"recent":[81],"mLLMs":[82],"fine-tuned":[84],"variants":[85],"across":[86],"several":[87],"generative":[88],"strategies":[90],"identify":[92],"factors":[93],"drive":[95],"performance.":[98],"Results":[99],"show":[100],"length":[103],"largely":[104],"determines":[105],"prompting":[107],"technique":[108],"effective,":[110],"more":[113,176],"elaborate":[114],"prompts":[115],"often":[116],"do":[117],"yield":[119],"further":[120],"gains.":[121],"Substantial":[122],"linguistic":[123],"disparities":[124],"persist:":[125],"can":[129],"produce":[130],"largest":[132],"improvements":[133],"for":[134,175],"languages":[135,146],"weakest":[138],"baselines,":[139],"yet":[140],"especially":[143],"poor":[144],"written":[147],"different":[149],"scripts.":[150],"Fine-tuning":[151],"found":[153],"lead":[155],"performance":[157],"gains":[158],"only":[159],"when":[160],"training":[162,181],"test":[164],"data":[165],"similar":[168],"format.":[169],"These":[170],"outcomes":[171],"underline":[172],"need":[174],"balanced":[177],"evaluation":[183],"resources.":[184]},"counts_by_year":[],"updated_date":"2025-11-27T01:16:37.896743","created_date":"2025-11-27T00:00:00"}
