{"id":"https://openalex.org/W7147270145","doi":"https://doi.org/10.48550/arxiv.2603.26669","title":"ReCQR: Incorporating conversational query rewriting to improve Multimodal Image Retrieval","display_name":"ReCQR: Incorporating conversational query rewriting to improve Multimodal Image Retrieval","publication_year":2026,"publication_date":"2026-01-19","ids":{"openalex":"https://openalex.org/W7147270145","doi":"https://doi.org/10.48550/arxiv.2603.26669"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.26669","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26669","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.26669","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132630674","display_name":"Yuan Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Hu, Yuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132609454","display_name":"ZhiYu Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, ZhiYu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125306698","display_name":"Peifeng Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, PeiFeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129706159","display_name":"Qiaoming Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, QiaoMing","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5132630674"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9776999950408936,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9776999950408936,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.007199999876320362,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.0034000000450760126,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rewriting","display_name":"Rewriting","score":0.7666000127792358},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7161999940872192},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.6323000192642212},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5102999806404114},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5098999738693237},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.49470001459121704},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4431000053882599},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.44119998812675476}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.85589998960495},{"id":"https://openalex.org/C154690210","wikidata":"https://www.wikidata.org/wiki/Q1668499","display_name":"Rewriting","level":2,"score":0.7666000127792358},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7161999940872192},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.6323000192642212},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6315000057220459},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5102999806404114},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5098999738693237},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.49470001459121704},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4431000053882599},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.44119998812675476},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4332999885082245},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.39070001244544983},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.3544999957084656},{"id":"https://openalex.org/C189391414","wikidata":"https://www.wikidata.org/wiki/Q7936579","display_name":"Visual Word","level":4,"score":0.3492000102996826},{"id":"https://openalex.org/C192028432","wikidata":"https://www.wikidata.org/wiki/Q845739","display_name":"Query language","level":2,"score":0.3474999964237213},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.33379998803138733},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.29670000076293945},{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.29670000076293945},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.28299999237060547},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.27390000224113464},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.26969999074935913}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.26669","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26669","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.26669","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26669","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.729056715965271,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,39,46,111,122,141],"rise":[2],"of":[3,143],"multimodal":[4,108,119,160],"learning,":[5],"image":[6,21,47,130,145],"retrieval":[7,48,146],"plays":[8],"a":[9,52],"crucial":[10],"role":[11],"in":[12,159],"connecting":[13],"visual":[14],"information":[15],"with":[16,24,100],"natural":[17],"language":[18],"queries.":[19],"Existing":[20],"retrievers":[22],"struggle":[23],"processing":[25],"long":[26],"texts":[27],"and":[28,50,94,153],"handling":[29],"unclear":[30],"user":[31,157],"expressions.":[32],"To":[33],"address":[34],"these":[35],"issues,":[36],"we":[37],"introduce":[38],"conversational":[40],"query":[41,56],"rewriting":[42,57],"(CQR)":[43],"task":[44],"into":[45,69],"domain":[49],"construct":[51],"dedicated":[53],"multi-turn":[54],"dialogue":[55,62],"dataset.":[58,113],"Built":[59],"on":[60,121,129],"full":[61],"histories,":[63],"CQR":[64,136],"rewrites":[65],"users'":[66],"final":[67],"queries":[68,158],"concise,":[70],"semantically":[71],"complete":[72],"ones":[73],"that":[74,135],"are":[75],"better":[76],"suited":[77],"for":[78,155],"retrieval.":[79,131],"Specifically,":[80],"We":[81,115],"first":[82],"leverage":[83],"Large":[84],"Language":[85],"Models":[86],"(LLMs)":[87],"to":[88,103,125],"generate":[89],"rewritten":[90],"candidates":[91],"at":[92],"scale":[93],"employ":[95],"an":[96],"LLM-as-Judge":[97],"mechanism":[98],"combined":[99],"manual":[101],"review":[102],"curate":[104],"approximately":[105],"7,000":[106],"high-quality":[107],"dialogues,":[109],"forming":[110],"ReCQR":[112,123],"Then":[114],"benchmark":[116],"several":[117],"SOTA":[118],"models":[120],"dataset":[124],"assess":[126],"their":[127],"performance":[128],"Experimental":[132],"results":[133],"demonstrate":[134],"not":[137],"only":[138],"significantly":[139],"enhances":[140],"accuracy":[142],"traditional":[144],"models,":[147],"but":[148],"also":[149],"provides":[150],"new":[151],"directions":[152],"insights":[154],"modeling":[156],"systems.":[161]},"counts_by_year":[],"updated_date":"2026-04-02T13:53:19.096889","created_date":"2026-04-02T00:00:00"}
