{"id":"https://openalex.org/W4406931868","doi":"https://doi.org/10.48550/arxiv.2501.16302","title":"Matryoshka Re-Ranker: A Flexible Re-Ranking Architecture With Configurable Depth and Width","display_name":"Matryoshka Re-Ranker: A Flexible Re-Ranking Architecture With Configurable Depth and Width","publication_year":2025,"publication_date":"2025-01-27","ids":{"openalex":"https://openalex.org/W4406931868","doi":"https://doi.org/10.48550/arxiv.2501.16302"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2501.16302","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.16302","pdf_url":"https://arxiv.org/pdf/2501.16302","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2501.16302","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100423680","display_name":"Zheng Liu","orcid":"https://orcid.org/0000-0002-2879-5859"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Liu, Zheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065277920","display_name":"Chaofan Li","orcid":"https://orcid.org/0000-0002-1859-8392"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Chaofan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044147794","display_name":"Shitao Xiao","orcid":"https://orcid.org/0000-0003-2567-6843"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Shitao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037831162","display_name":"Chaozhuo Li","orcid":"https://orcid.org/0000-0002-9867-1712"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Chaozhuo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085254654","display_name":"Defu Lian","orcid":"https://orcid.org/0000-0002-3507-9607"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lian, Defu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5014615052","display_name":"Yingxia Shao","orcid":"https://orcid.org/0000-0002-8559-2628"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shao, Yingxia","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100423680"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.3711000084877014,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.3711000084877014,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.7155717015266418},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.6472660303115845},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5437728762626648},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.41342905163764954},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36067289113998413},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.1759355068206787}],"concepts":[{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.7155717015266418},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.6472660303115845},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5437728762626648},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.41342905163764954},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36067289113998413},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.1759355068206787},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2501.16302","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.16302","pdf_url":"https://arxiv.org/pdf/2501.16302","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2501.16302","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2501.16302","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2501.16302","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.16302","pdf_url":"https://arxiv.org/pdf/2501.16302","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4406931868.pdf","grobid_xml":"https://content.openalex.org/works/W4406931868.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2038503502"],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"provide":[4],"powerful":[5],"foundations":[6],"to":[7,20,39,89,102,142],"perform":[8,158],"fine-grained":[9],"text":[10],"re-ranking.":[11],"However,":[12],"they":[13],"are":[14,139],"often":[15],"prohibitive":[16],"in":[17],"reality":[18],"due":[19],"constraints":[21],"on":[22,53,162],"computation":[23],"bandwidth.":[24],"In":[25,179],"this":[26,81],"work,":[27],"we":[28,83,94,124],"propose":[29,95],"a":[30,85,104,126],"\\textbf{flexible}":[31],"architecture":[32],"called":[33],"\\textbf{Matroyshka":[34],"Re-Ranker},":[35],"which":[36],"is":[37],"designed":[38],"facilitate":[40],"\\textbf{runtime":[41],"customization}":[42],"of":[43,76,87,152,198],"model":[44],"layers":[45],"and":[46,119,137,154,165,200],"sequence":[47,155],"lengths":[48],"at":[49,73],"each":[50,99],"layer":[51,153],"based":[52,161],"users'":[54],"configurations.":[55],"Consequently,":[56],"the":[57,74,91,145,163,186],"LLM-based":[58],"re-rankers":[59],"can":[60,114],"be":[61,115],"made":[62],"applicable":[63],"across":[64,195],"various":[65,196],"real-world":[66],"situations.":[67],"The":[68],"increased":[69],"flexibility":[70],"may":[71],"come":[72],"cost":[75],"precision":[77,146],"loss.":[78],"To":[79],"address":[80],"problem,":[82],"introduce":[84],"suite":[86],"techniques":[88],"optimize":[90],"performance.":[92],"First,":[93],"\\textbf{cascaded":[96],"self-distillation},":[97],"where":[98,130],"sub-architecture":[100],"learns":[101],"preserve":[103],"precise":[105],"re-ranking":[106],"performance":[107,194],"from":[108,149,169,176],"its":[109,192],"super":[110],"components,":[111],"whose":[112],"predictions":[113],"exploited":[116],"as":[117],"smooth":[118],"informative":[120],"teacher":[121],"signals.":[122],"Second,":[123],"design":[125],"\\textbf{factorized":[127],"compensation":[128],"mechanism},":[129],"two":[131],"collaborative":[132],"Low-Rank":[133],"Adaptation":[134],"modules,":[135],"vertical":[136],"horizontal,":[138],"jointly":[140],"employed":[141],"compensate":[143],"for":[144],"loss":[147],"resulted":[148],"arbitrary":[150],"combinations":[151],"compression.":[156],"We":[157],"comprehensive":[159],"experiments":[160],"passage":[164],"document":[166],"retrieval":[167],"datasets":[168,175],"MSMARCO,":[170],"along":[171],"with":[172],"all":[173],"public":[174],"BEIR":[177],"benchmark.":[178],"our":[180],"experiments,":[181],"Matryoshka":[182],"Re-Ranker":[183],"substantially":[184],"outperforms":[185],"existing":[187],"methods,":[188],"while":[189],"effectively":[190],"preserving":[191],"superior":[193],"forms":[197],"compression":[199],"different":[201],"application":[202],"scenarios.":[203]},"counts_by_year":[],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2025-10-10T00:00:00"}
