{"id":"https://openalex.org/W4390268206","doi":"https://doi.org/10.1007/s00778-023-00831-y","title":"DB-BERT: making database tuning tools \u201cread\u201d the manual","display_name":"DB-BERT: making database tuning tools \u201cread\u201d the manual","publication_year":2023,"publication_date":"2023-12-27","ids":{"openalex":"https://openalex.org/W4390268206","doi":"https://doi.org/10.1007/s00778-023-00831-y"},"language":"en","primary_location":{"id":"doi:10.1007/s00778-023-00831-y","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00778-023-00831-y","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00778-023-00831-y.pdf","source":{"id":"https://openalex.org/S78926909","display_name":"The VLDB Journal","issn_l":"0949-877X","issn":["0949-877X","1066-8888"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The VLDB Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s00778-023-00831-y.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087259526","display_name":"Immanuel Trummer","orcid":"https://orcid.org/0000-0002-7203-2349"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Immanuel Trummer","raw_affiliation_strings":["Cornell University, Ithaca, NY, USA"],"affiliations":[{"raw_affiliation_string":"Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5087259526"],"corresponding_institution_ids":["https://openalex.org/I205783295"],"apc_list":{"value":2290,"currency":"EUR","value_usd":2890},"apc_paid":{"value":2290,"currency":"EUR","value_usd":2890},"fwci":0.5185,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.73336365,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"33","issue":"4","first_page":"1085","last_page":"1104"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8767591118812561},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7821310758590698},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6717804074287415},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5735036730766296},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.5609092712402344},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5154320001602173},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.5089514255523682},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4696074426174164},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.39687004685401917},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33942657709121704},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3240281939506531},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1444193422794342},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.14402025938034058},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.07863837480545044}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8767591118812561},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7821310758590698},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6717804074287415},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5735036730766296},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.5609092712402344},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5154320001602173},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.5089514255523682},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4696074426174164},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.39687004685401917},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33942657709121704},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3240281939506531},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1444193422794342},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.14402025938034058},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.07863837480545044},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s00778-023-00831-y","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00778-023-00831-y","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00778-023-00831-y.pdf","source":{"id":"https://openalex.org/S78926909","display_name":"The VLDB Journal","issn_l":"0949-877X","issn":["0949-877X","1066-8888"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The VLDB Journal","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s00778-023-00831-y","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00778-023-00831-y","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00778-023-00831-y.pdf","source":{"id":"https://openalex.org/S78926909","display_name":"The VLDB Journal","issn_l":"0949-877X","issn":["0949-877X","1066-8888"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The VLDB Journal","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.5199999809265137}],"awards":[{"id":"https://openalex.org/G6671297155","display_name":null,"funder_award_id":"CAREER","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7093577988","display_name":null,"funder_award_id":"2239326","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4390268206.pdf"},"referenced_works_count":44,"referenced_works":["https://openalex.org/W1628341315","https://openalex.org/W1997783781","https://openalex.org/W2396309311","https://openalex.org/W2536574992","https://openalex.org/W2613206411","https://openalex.org/W2746553466","https://openalex.org/W2889503624","https://openalex.org/W2890431379","https://openalex.org/W2944240329","https://openalex.org/W2945102109","https://openalex.org/W2948513753","https://openalex.org/W2963026768","https://openalex.org/W2963748441","https://openalex.org/W2963853546","https://openalex.org/W2964915587","https://openalex.org/W2970148517","https://openalex.org/W2970851599","https://openalex.org/W2979826702","https://openalex.org/W3020084632","https://openalex.org/W3029327553","https://openalex.org/W3035140194","https://openalex.org/W3084740534","https://openalex.org/W3095319910","https://openalex.org/W3098304379","https://openalex.org/W3099273181","https://openalex.org/W3100925961","https://openalex.org/W3103801878","https://openalex.org/W3139827290","https://openalex.org/W3148437589","https://openalex.org/W3150554837","https://openalex.org/W3165814564","https://openalex.org/W3173850788","https://openalex.org/W3208735199","https://openalex.org/W4281754544","https://openalex.org/W4281972940","https://openalex.org/W4285335450","https://openalex.org/W4312537169","https://openalex.org/W4312903631","https://openalex.org/W4380433215","https://openalex.org/W4386123453","https://openalex.org/W4389315083","https://openalex.org/W4389539730","https://openalex.org/W6600388300","https://openalex.org/W6605450533"],"related_works":["https://openalex.org/W17155033","https://openalex.org/W3207760230","https://openalex.org/W1496222301","https://openalex.org/W1590307681","https://openalex.org/W4312814274","https://openalex.org/W4285370786","https://openalex.org/W2296488620","https://openalex.org/W2358353312","https://openalex.org/W2353836703","https://openalex.org/W4386541577"],"abstract_inverted_index":{"Abstract":[0],"DB-BERT":[1,38,73,140,168,193],"is":[2,194],"a":[3,86],"database":[4,27,88,113,132,158,175],"tuning":[5,105,133],"tool":[6],"that":[7,111,119,167],"exploits":[8],"information":[9,173],"gained":[10,184],"via":[11,185],"natural":[12,64],"language":[13,42,65],"analysis":[14],"of":[15,104,128,192],"manuals":[16],"and":[17,78,90,96,148,152,161],"other":[18],"relevant":[19],"text":[20,24,49,129,179],"documents.":[21],"It":[22],"uses":[23],"to":[25,30,62,75,81,100,107],"identify":[26],"system":[28,89,114],"parameters":[29],"tune":[31],"as":[32,34,134,155,157],"well":[33,156],"recommended":[35,68],"parameter":[36],"values.":[37],"applies":[39],"large,":[40],"pre-trained":[41],"models":[43],"(specifically,":[44],"the":[45,102,112],"BERT":[46],"model)":[47],"for":[48,85,136],"analysis.":[50],"During":[51],"an":[52],"initial":[53],"training":[54],"phase,":[55],"it":[56],"fine-tunes":[57],"model":[58],"weights":[59],"in":[60],"order":[61],"translate":[63],"hints":[66,80],"into":[67],"settings.":[69],"At":[70],"run":[71,153],"time,":[72],"learns":[74],"aggregate,":[76],"adapt,":[77],"prioritize":[79],"achieve":[82],"optimal":[83],"performance":[84],"specific":[87],"benchmark.":[91],"Both":[92],"phases":[93],"are":[94],"iterative":[95],"use":[97],"reinforcement":[98],"learning":[99],"guide":[101],"selection":[103],"settings":[106,110,118],"evaluate":[108],"(penalizing":[109],"rejects":[115],"while":[116],"rewarding":[117],"improve":[120],"performance).":[121],"In":[122],"our":[123],"experiments,":[124],"we":[125],"leverage":[126],"hundreds":[127],"documents":[130],"about":[131,174],"input":[135],"DB-BERT.":[137],"We":[138],"compare":[139],"against":[141],"various":[142],"baselines,":[143],"considering":[144],"different":[145],"benchmarks":[146],"(TPC-C":[147],"TPC-H),":[149],"metrics":[150],"(throughput":[151],"time),":[154],"systems":[159],"(PostgreSQL":[160],"MySQL).":[162],"The":[163,188],"experiments":[164],"demonstrate":[165],"clearly":[166],"benefits":[169],"from":[170,178],"combining":[171],"general":[172],"tuning,":[176],"mined":[177],"documents,":[180],"with":[181],"scenario-specific":[182],"insights,":[183],"trial":[186],"runs.":[187],"full":[189],"source":[190],"code":[191],"available":[195],"online":[196],"at":[197],"https://itrummer.github.io/dbbert/":[198],".":[199]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
