{"id":"https://openalex.org/W7162545024","doi":"https://doi.org/10.48550/arxiv.2605.27361","title":"Natural Language Query to Configuration for Retrieval Agents","display_name":"Natural Language Query to Configuration for Retrieval Agents","publication_year":2026,"publication_date":"2026-05-26","ids":{"openalex":"https://openalex.org/W7162545024","doi":"https://doi.org/10.48550/arxiv.2605.27361"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.27361","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27361","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.27361","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126852859","display_name":"Melissa Pan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Melissa Z.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049487742","display_name":"Negar Arabzadeh","orcid":"https://orcid.org/0000-0002-4411-7089"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Arabzadeh, Negar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137133644","display_name":"Mathew Jacob","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jacob, Mathew","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005485274","display_name":"Fiodar Kazhamiaka","orcid":"https://orcid.org/0000-0002-0798-5151"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kazhamiaka, Fiodar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045708568","display_name":"Esha Choukse","orcid":"https://orcid.org/0000-0003-0371-5522"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choukse, Esha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137162622","display_name":"Matei Zaharia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zaharia, Matei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.8881999850273132,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.8881999850273132,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.02969999983906746,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.015399999916553497,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6722999811172485},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.6449999809265137},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5935999751091003},{"id":"https://openalex.org/keywords/query-optimization","display_name":"Query optimization","score":0.585099995136261},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.4814000129699707},{"id":"https://openalex.org/keywords/query-expansion","display_name":"Query expansion","score":0.477400004863739},{"id":"https://openalex.org/keywords/query-language","display_name":"Query language","score":0.47609999775886536},{"id":"https://openalex.org/keywords/pareto-principle","display_name":"Pareto principle","score":0.39430001378059387}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8016999959945679},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6722999811172485},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.6449999809265137},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5935999751091003},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.585099995136261},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.4814000129699707},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.47760000824928284},{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.477400004863739},{"id":"https://openalex.org/C192028432","wikidata":"https://www.wikidata.org/wiki/Q845739","display_name":"Query language","level":2,"score":0.47609999775886536},{"id":"https://openalex.org/C137635306","wikidata":"https://www.wikidata.org/wiki/Q182667","display_name":"Pareto principle","level":2,"score":0.39430001378059387},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.37369999289512634},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.37070000171661377},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.3569999933242798},{"id":"https://openalex.org/C24028149","wikidata":"https://www.wikidata.org/wiki/Q7094056","display_name":"Online aggregation","level":5,"score":0.34470000863075256},{"id":"https://openalex.org/C190839683","wikidata":"https://www.wikidata.org/wiki/Q2448197","display_name":"Train","level":2,"score":0.3409000039100647},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3301999866962433},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.29910001158714294},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2782999873161316},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.27239999175071716},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.2712000012397766},{"id":"https://openalex.org/C129916263","wikidata":"https://www.wikidata.org/wiki/Q1141183","display_name":"Backward chaining","level":4,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.27361","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27361","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.27361","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27361","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Modern":[0],"retrieval":[1,167],"agents":[2],"expose":[3],"many":[4],"configuration":[5,65,111,163],"choices":[6],"--":[7,19],"LLM,":[8],"retriever,":[9],"number":[10,13],"of":[11,14,164],"documents,":[12],"hops,":[15],"and":[16,25,50,129,150,154],"synthesis":[17],"strategy":[18],"each":[20,84],"shaping":[21],"both":[22],"answer":[23,101],"quality":[24],"serving":[26],"cost.":[27],"Today,":[28],"these":[29],"pipelines":[30],"are":[31],"typically":[32],"hand-tuned":[33],"once":[34],"per":[35],"workload,":[36],"leaving":[37],"substantial":[38],"per-query":[39,162],"optimization":[40],"untapped.":[41],"We":[42,75],"formulate":[43],"the":[44,64,98,102,110,134,139,165],"problem:":[45],"given":[46],"a":[47,55,60,91,120,170],"natural-language":[48],"query":[49,85,103],"either":[51],"an":[52,80],"accuracy":[53,71,143],"or":[54,69],"budget":[56],"target,":[57],"select":[58],"from":[59],"predefined":[61],"pipeline":[62,99,168],"catalog":[63],"that":[66,95,112,161],"minimizes":[67],"cost":[68],"maximizes":[70,113],"at":[72,144],"inference":[73,106],"time.":[74],"propose":[76],"**BRANE**,":[77],"which":[78],"uses":[79],"LLM":[81],"to":[82,146,173],"convert":[83],"into":[86],"workload-specific":[87],"characteristics,":[88],"then":[89],"trains":[90],"lightweight":[92],"per-configuration":[93],"predictor":[94],"estimates":[96],"whether":[97],"will":[100],"correctly.":[104],"At":[105],"time,":[107],"**BRANE**":[108,131],"selects":[109],"predicted":[114],"correctness":[115],"penalized":[116],"by":[117],"cost,":[118,149],"exposing":[119],"tunable":[121],"cost-quality":[122,135],"tradeoff":[123],"without":[124],"retraining.":[125],"Across":[126],"MuSiQue,":[127],"BrowseComp-Plus,":[128],"FinanceBench,":[130],"consistently":[132],"pushes":[133],"Pareto":[136],"frontier,":[137],"matches":[138],"best":[140],"fixed":[141],"configuration's":[142],"up":[145],"89%":[147],"lower":[148],"outperforms":[151],"LLM-routing,":[152],"rule-based,":[153],"fine-tuned":[155],"Qwen3-4B":[156],"baselines.":[157],"These":[158],"results":[159],"show":[160],"full":[166],"is":[169],"practical":[171],"alternative":[172],"static":[174],"workload-level":[175],"tuning.":[176]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-28T00:00:00"}
