{"id":"https://openalex.org/W4416667642","doi":"https://doi.org/10.48550/arxiv.2511.17044","title":"Parametric Retrieval-Augmented Generation using Latent Routing of LoRA Adapters","display_name":"Parametric Retrieval-Augmented Generation using Latent Routing of LoRA Adapters","publication_year":2025,"publication_date":"2025-11-21","ids":{"openalex":"https://openalex.org/W4416667642","doi":"https://doi.org/10.48550/arxiv.2511.17044"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2511.17044","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.17044","pdf_url":"https://arxiv.org/pdf/2511.17044","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2511.17044","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100650130","display_name":"Zhan Su","orcid":"https://orcid.org/0000-0002-2310-8781"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Zhan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048033573","display_name":"Fengran Mo","orcid":"https://orcid.org/0000-0002-0838-6994"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mo, Fengran","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhang, Jinghan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jinghan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Hui, Yuchen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hui, Yuchen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Sun, Jiaao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Jiaao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Nie, Jian-yun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nie, Jian-yun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.32420000433921814,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.32420000433921814,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.11749999970197678,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.1080000028014183,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.8345999717712402},{"id":"https://openalex.org/keywords/adapter","display_name":"Adapter (computing)","score":0.7214000225067139},{"id":"https://openalex.org/keywords/routing","display_name":"Routing (electronic design automation)","score":0.5192999839782715},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5174000263214111},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.47909998893737793},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.47870001196861267},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.4708000123500824}],"concepts":[{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.8345999717712402},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7444999814033508},{"id":"https://openalex.org/C177284502","wikidata":"https://www.wikidata.org/wiki/Q1005390","display_name":"Adapter (computing)","level":2,"score":0.7214000225067139},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.5192999839782715},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5174000263214111},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.47909998893737793},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.47870001196861267},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.4708000123500824},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.44839999079704285},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.4142000079154968},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.3075000047683716},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.2964000105857849},{"id":"https://openalex.org/C104954878","wikidata":"https://www.wikidata.org/wiki/Q1648707","display_name":"Routing protocol","level":3,"score":0.26030001044273376},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.2596000134944916},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2547999918460846},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2540999948978424},{"id":"https://openalex.org/C184896649","wikidata":"https://www.wikidata.org/wiki/Q290066","display_name":"Routing table","level":4,"score":0.2531000077724457}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2511.17044","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.17044","pdf_url":"https://arxiv.org/pdf/2511.17044","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2511.17044","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.17044","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2511.17044","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.17044","pdf_url":"https://arxiv.org/pdf/2511.17044","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Parametric":[0],"Retrieval-Augmented":[1],"Generation":[2],"(PRAG)":[3],"is":[4,145],"a":[5,17,35,41,65,102,122,127,149,169,202,210],"RAG":[6],"approach":[7,88,191],"that":[8,108],"integrates":[9],"external":[10,216],"knowledge":[11,83,154,217],"directly":[12],"into":[13,218],"model":[14],"parameters":[15],"using":[16,40,121],"LoRA":[18,43,74,106,135,143,206],"adapter,":[19],"aiming":[20],"at":[21],"reducing":[22],"the":[23,57,81,87,97,134,138,153,158,163,177,180,193,198],"inference":[24],"cost":[25,67],"compared":[26,182],"to":[27,80,111,147,183,200,214],"traditional":[28],"RAG.":[29],"However,":[30],"current":[31],"PRAG":[32,186],"approaches":[33],"adopt":[34],"\\textit{one-to-one}":[36],"document":[37,117],"encoding":[38],"scheme,":[39],"dedicated":[42],"adapter":[44,144],"for":[45,68,168],"each":[46,142],"individual":[47],"document.":[48,170],"This":[49],"scheme":[50],"introduces":[51],"two":[52],"major":[53],"limitations:":[54],"1)":[55],"As":[56],"number":[58,204],"of":[59,105,124,152,166,179,205],"documents":[60],"increases,":[61],"there":[62],"will":[63],"be":[64,119],"prohibitive":[66],"training":[69,133],"and":[70,137,157,208],"storage.":[71],"2)":[72],"The":[73],"adapters":[75,107,136,167,207],"may":[76],"largely":[77],"overlap":[78],"due":[79],"shared":[82,150],"across":[84,155],"documents,":[85,156],"making":[86],"highly":[89],"inefficient.":[90],"To":[91],"overcome":[92],"these":[93],"challenges,":[94],"we":[95],"propose":[96],"Poly-PRAG":[98,181],"approach,":[99],"which":[100],"uses":[101],"small":[103],"set":[104],"are":[109],"able":[110,146],"encode":[112,148,215],"more":[113,211],"general":[114],"knowledge.":[115],"Each":[116],"can":[118,161],"encoded":[120],"combination":[123,165],"them":[125],"through":[126],"latent":[128,139],"routing":[129,140,159],"function.":[130],"By":[131],"jointly":[132],"function,":[141],"part":[151],"function":[160],"select":[162],"best":[164],"Experimental":[171],"results":[172],"on":[173],"four":[174],"benchmarks":[175],"demonstrate":[176],"effectiveness":[178],"other":[184],"strong":[185],"baselines.":[187],"In":[188],"addition,":[189],"this":[190],"reduces":[192],"storage":[194],"requirement":[195],"by":[196],"avoiding":[197],"need":[199],"store":[201],"large":[203],"offers":[209],"efficient":[212],"way":[213],"LLMs.":[219]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-11-25T00:00:00"}
