{"id":"https://openalex.org/W4414244615","doi":"https://doi.org/10.14778/3750601.3750625","title":"R-Bot: An LLM-Based Query Rewrite System","display_name":"R-Bot: An LLM-Based Query Rewrite System","publication_year":2025,"publication_date":"2025-08-01","ids":{"openalex":"https://openalex.org/W4414244615","doi":"https://doi.org/10.14778/3750601.3750625"},"language":"en","primary_location":{"id":"doi:10.14778/3750601.3750625","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3750601.3750625","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053352268","display_name":"Zhaoyan Sun","orcid":"https://orcid.org/0009-0000-2688-4981"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhaoyan Sun","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056912386","display_name":"Xuanhe Zhou","orcid":"https://orcid.org/0000-0002-2285-7836"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuanhe Zhou","raw_affiliation_strings":["Shanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119268361","display_name":"Guoliang Li","orcid":"https://orcid.org/0009-0007-8430-5141"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guoliang Li","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101426810","display_name":"Xiang Yu","orcid":"https://orcid.org/0000-0001-9431-5131"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiang Yu","raw_affiliation_strings":["Huawei Company"],"affiliations":[{"raw_affiliation_string":"Huawei Company","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100951661","display_name":"Jianhua Feng","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianhua Feng","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100419741","display_name":"Yong Zhang","orcid":"https://orcid.org/0000-0001-8803-2055"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Zhang","raw_affiliation_strings":["Tsinghua University"],"affiliations":[{"raw_affiliation_string":"Tsinghua University","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5053352268"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":1.6666,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.88325142,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"18","issue":"12","first_page":"5031","last_page":"5044"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10400","display_name":"Network Security and Intrusion Detection","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10679","display_name":"Service-Oriented Architecture and Web Services","score":0.9751999974250793,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9743000268936157,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/query-language","display_name":"Query language","score":0.6409000158309937},{"id":"https://openalex.org/keywords/query-optimization","display_name":"Query optimization","score":0.6074000000953674},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.5443000197410583},{"id":"https://openalex.org/keywords/query-expansion","display_name":"Query expansion","score":0.5335000157356262},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5228000283241272},{"id":"https://openalex.org/keywords/sargable","display_name":"Sargable","score":0.49570000171661377},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4894999861717224},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4699999988079071},{"id":"https://openalex.org/keywords/sql","display_name":"SQL","score":0.4456000030040741}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8396999835968018},{"id":"https://openalex.org/C192028432","wikidata":"https://www.wikidata.org/wiki/Q845739","display_name":"Query language","level":2,"score":0.6409000158309937},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.6074000000953674},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.5443000197410583},{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.5335000157356262},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5228000283241272},{"id":"https://openalex.org/C192939062","wikidata":"https://www.wikidata.org/wiki/Q104840822","display_name":"Sargable","level":4,"score":0.49570000171661377},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4894999861717224},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4699999988079071},{"id":"https://openalex.org/C510870499","wikidata":"https://www.wikidata.org/wiki/Q47607","display_name":"SQL","level":2,"score":0.4456000030040741},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4059000015258789},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.38359999656677246},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.37130001187324524},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3228999972343445},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.32019999623298645},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.2962999939918518},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.29319998621940613},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.28690001368522644},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.28630000352859497},{"id":"https://openalex.org/C65647387","wikidata":"https://www.wikidata.org/wiki/Q1781706","display_name":"Conjunctive query","level":3,"score":0.27869999408721924},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.27630001306533813},{"id":"https://openalex.org/C96956885","wikidata":"https://www.wikidata.org/wiki/Q6138701","display_name":"RDF query language","level":5,"score":0.27619999647140503},{"id":"https://openalex.org/C154690210","wikidata":"https://www.wikidata.org/wiki/Q1668499","display_name":"Rewriting","level":2,"score":0.271699994802475},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26589998602867126},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.26570001244544983},{"id":"https://openalex.org/C174252522","wikidata":"https://www.wikidata.org/wiki/Q3816772","display_name":"Natural language user interface","level":3,"score":0.2583000063896179},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.14778/3750601.3750625","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3750601.3750625","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W135863099","https://openalex.org/W2136195851","https://openalex.org/W2970641574","https://openalex.org/W3196849431","https://openalex.org/W3207801254","https://openalex.org/W4205381461","https://openalex.org/W4221143046","https://openalex.org/W4281787155","https://openalex.org/W4283326127","https://openalex.org/W4289866538","https://openalex.org/W4291713239","https://openalex.org/W4383605243","https://openalex.org/W4386123427","https://openalex.org/W4386128181","https://openalex.org/W4386768432","https://openalex.org/W4389609814","https://openalex.org/W4391032878","https://openalex.org/W4392453910","https://openalex.org/W4394745858","https://openalex.org/W4399208444","https://openalex.org/W4401352024","https://openalex.org/W4402042542","https://openalex.org/W4402043038","https://openalex.org/W4404181035","https://openalex.org/W4404181272","https://openalex.org/W4404181362","https://openalex.org/W4407385475","https://openalex.org/W4411374555","https://openalex.org/W4411403466"],"related_works":[],"abstract_inverted_index":{"Query":[0],"rewrite":[1,94,105,112,139,153,165,193],"is":[2],"essential":[3],"for":[4,114,141],"optimizing":[5],"SQL":[6],"queries":[7],"to":[8,70,109,117,134,161],"improve":[9],"their":[10,15,50,59],"execution":[11],"efficiency":[12],"without":[13],"changing":[14],"results.":[16,83],"Traditionally,":[17],"this":[18],"task":[19],"has":[20,66,198],"been":[21,199],"tackled":[22],"through":[23],"heuristic":[24],"and":[25,37,54,131,163,176,180,203,207],"learning-based":[26],"methods,":[27],"each":[28],"with":[29,96,167,204],"its":[30],"limitations":[31],"in":[32,42],"terms":[33],"of":[34,185],"inferior":[35],"quality":[36],"low":[38],"robustness.":[39],"Recent":[40],"advancements":[41],"LLMs":[43,63,116],"offer":[44],"a":[45,97,103,123,150],"new":[46],"paradigm":[47],"by":[48],"leveraging":[49],"superior":[51,183],"natural":[52],"language":[53],"code":[55],"comprehension":[56],"abilities.":[57],"Despite":[58],"potential,":[60],"directly":[61],"applying":[62],"like":[64],"GPT-4":[65],"faced":[67],"challenges":[68],"due":[69],"problems":[71],"such":[72],"as":[73],"hallucinations,":[74],"where":[75],"the":[76,136,158,182,208,212],"model":[77],"might":[78],"generate":[79,110],"inaccurate":[80],"or":[81],"irrelevant":[82],"To":[84],"address":[85],"this,":[86],"we":[87],"propose":[88,122,149],"R-Bot":[89,188,196,214],",":[90,189],"an":[91,144],"LLM-based":[92],"query":[93,111,192,218],"system":[95,197,215],"systematic":[98],"approach.":[99],"We":[100,120,147,169],"first":[101],"design":[102],"multi-source":[104],"evidence":[106],"preparation":[107],"pipeline":[108],"evidences":[113,140,160],"guiding":[115],"avoid":[118],"hallucinations.":[119],"then":[121],"hybrid":[124],"structure-semantics":[125],"retrieval":[126],"method":[127,154],"that":[128,155,211],"combines":[129],"structural":[130],"semantic":[132],"analysis":[133],"retrieve":[135],"most":[137],"relevant":[138],"effectively":[142],"answering":[143],"online":[145],"query.":[146],"next":[148],"step-by-step":[151],"LLM":[152],"iteratively":[156],"leverages":[157],"retrieved":[159],"select":[162],"arrange":[164],"rules":[166],"self-reflection.":[168],"conduct":[170],"comprehensive":[171],"experiments":[172],"on":[173],"real-world":[174],"datasets":[175],"widely":[177],"used":[178],"benchmarks,":[179],"demonstrate":[181],"performance":[184],"our":[186],"system,":[187],"surpassing":[190],"state-of-the-art":[191],"methods.":[194],"The":[195],"deployed":[200],"at":[201],"Huawei":[202],"real":[205],"customers,":[206],"results":[209],"show":[210],"proposed":[213],"achieves":[216],"lower":[217],"latency.":[219]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
