{"id":"https://openalex.org/W7109215121","doi":"https://doi.org/10.1145/3769839","title":"Understanding and Detecting Query Performance Regression in Practical Index Tuning: [Experiments &amp; Analysis]","display_name":"Understanding and Detecting Query Performance Regression in Practical Index Tuning: [Experiments &amp; Analysis]","publication_year":2025,"publication_date":"2025-12-04","ids":{"openalex":"https://openalex.org/W7109215121","doi":"https://doi.org/10.1145/3769839"},"language":"en","primary_location":{"id":"doi:10.1145/3769839","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3769839","pdf_url":null,"source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1145/3769839","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Wentao Wu","orcid":"https://orcid.org/0009-0006-2454-7109"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Wentao Wu","raw_affiliation_strings":["Microsoft Research, Redmond, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Anshuman Dutt","orcid":"https://orcid.org/0000-0003-2861-4883"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anshuman Dutt","raw_affiliation_strings":["Microsoft Research, Redmond, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Gaoxiang Xu","orcid":"https://orcid.org/0000-0001-7319-2857"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gaoxiang Xu","raw_affiliation_strings":["Microsoft Research, Redmond, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Vivek Narasayya","orcid":"https://orcid.org/0000-0001-7011-7886"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vivek Narasayya","raw_affiliation_strings":["Microsoft Research, Redmond, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"last","author":{"id":null,"display_name":"Surajit Chaudhuri","orcid":"https://orcid.org/0000-0001-8252-5270"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Surajit Chaudhuri","raw_affiliation_strings":["Microsoft Research, Redmond, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I1290206253"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.61906412,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"3","issue":"6","first_page":"1","last_page":"26"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.32030001282691956,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.32030001282691956,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.22750000655651093,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.11940000206232071,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6600000262260437},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.6527000069618225},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.49300000071525574},{"id":"https://openalex.org/keywords/sql","display_name":"SQL","score":0.4652000069618225},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.44620001316070557},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.39910000562667847},{"id":"https://openalex.org/keywords/query-optimization","display_name":"Query optimization","score":0.37119999527931213},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.3433000147342682}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7857000231742859},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6600000262260437},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.6527000069618225},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.6370000243186951},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.49300000071525574},{"id":"https://openalex.org/C510870499","wikidata":"https://www.wikidata.org/wiki/Q47607","display_name":"SQL","level":2,"score":0.4652000069618225},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.44620001316070557},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.39910000562667847},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.37119999527931213},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.34459999203681946},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.3433000147342682},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32690000534057617},{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.31540000438690186},{"id":"https://openalex.org/C130590232","wikidata":"https://www.wikidata.org/wiki/Q1671754","display_name":"Inverted index","level":3,"score":0.31139999628067017},{"id":"https://openalex.org/C2776836416","wikidata":"https://www.wikidata.org/wiki/Q1364844","display_name":"False alarm","level":2,"score":0.2935999929904938},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.29280000925064087},{"id":"https://openalex.org/C192939062","wikidata":"https://www.wikidata.org/wiki/Q104840822","display_name":"Sargable","level":4,"score":0.29170000553131104},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.28600001335144043},{"id":"https://openalex.org/C59276292","wikidata":"https://www.wikidata.org/wiki/Q580427","display_name":"Database index","level":3,"score":0.2854999899864197},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.28060001134872437},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.2671000063419342},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.25529998540878296},{"id":"https://openalex.org/C2779729312","wikidata":"https://www.wikidata.org/wiki/Q784232","display_name":"Query plan","level":5,"score":0.25429999828338623},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.2526000142097473}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3769839","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3769839","pdf_url":null,"source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3769839","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3769839","pdf_url":null,"source":{"id":"https://openalex.org/S4387289859","display_name":"Proceedings of the ACM on Management of Data","issn_l":"2836-6573","issn":["2836-6573"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Management of Data","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W2081728040","https://openalex.org/W2098443134","https://openalex.org/W2103702871","https://openalex.org/W2145676903","https://openalex.org/W2167978511","https://openalex.org/W2338318698","https://openalex.org/W2396309311","https://openalex.org/W2565516711","https://openalex.org/W2883510886","https://openalex.org/W2911464154","https://openalex.org/W2970148517","https://openalex.org/W2998249308","https://openalex.org/W3011998105","https://openalex.org/W3094011786","https://openalex.org/W3095166039","https://openalex.org/W3111141572","https://openalex.org/W3165842875","https://openalex.org/W3207801254","https://openalex.org/W4211032723","https://openalex.org/W4283326127","https://openalex.org/W4294903983","https://openalex.org/W4312656534","https://openalex.org/W4313138291","https://openalex.org/W4386128208","https://openalex.org/W4391055215","https://openalex.org/W4393183958","https://openalex.org/W4403636019"],"related_works":[],"abstract_inverted_index":{"Existing":[0],"index":[1,27,68,131,143,156],"tuners":[2],"typically":[3],"rely":[4],"on":[5,23],"the":[6,12,17,46,88,93,116,129,136,165,180,198],"''what":[7],"if''":[8],"API":[9],"provided":[10],"by":[11],"query":[13,22,41,117],"optimizer":[14],"to":[15,39,86,103,128,171],"estimate":[16],"execution":[18],"cost":[19,30],"of":[20,25,81,90,164,175],"a":[21,53,172,188],"top":[24],"an":[26,71,110],"configuration.":[28],"Such":[29],"estimates":[31],"can":[32,168,202],"be":[33,169],"inaccurate":[34],"and":[35,106,122,149,184],"may":[36],"therefore":[37],"lead":[38],"significant":[40,120,166],"performance":[42],"regression":[43],"(QPR)":[44],"once":[45],"recommended":[47],"indexes":[48],"are":[49],"materialized.":[50],"This":[51],"becomes":[52],"serious":[54],"problem":[55],"for":[56,124,142,153],"cloud":[57],"database":[58,151],"providers,":[59],"such":[60,140],"as":[61,70],"Microsoft's":[62],"Azure":[63],"SQL":[64],"Database,":[65],"that":[66,133,162,197],"offer":[67],"tuning":[69,144,157],"automated":[72],"service":[73],"(a.k.a.":[74],"''auto-indexing'').":[75],"Previous":[76],"work":[77],"has":[78],"explored":[79],"use":[80],"supervised":[82],"machine":[83],"learning":[84],"(ML)":[85],"reduce":[87],"likelihood":[89],"QPR.":[91,137],"However,":[92],"trained":[94],"ML":[95],"models":[96],"have":[97],"limited":[98],"generalization":[99],"capability":[100],"when":[101],"applied":[102],"new":[104,130],"databases":[105],"workloads.":[107],"We":[108,138],"propose":[109,187],"alternative":[111],"approach":[112],"where":[113],"we":[114,185],"analyze":[115],"plans":[118],"with":[119],"QPRs":[121,167],"look":[123],"structural":[125,181],"changes":[126],"due":[127],"configuration":[132],"could":[134],"explain":[135],"perform":[139],"study":[141,160],"data":[145],"across":[146],"many":[147],"benchmark":[148],"real-world":[150],"workloads,":[152],"multiple":[154],"realistic":[155],"scenarios.":[158],"Our":[159,193],"reveals":[161],"most":[163],"attributed":[170],"small":[173],"number":[174],"common":[176],"''regression":[177],"patterns''":[178],"characterizing":[179],"plan":[182],"changes,":[183],"further":[186],"pattern-based":[189,199],"QPR":[190,200,207],"detector":[191,201],"accordingly.":[192],"experimental":[194],"evaluation":[195],"shows":[196],"significantly":[203],"outperform":[204],"existing":[205],"ML-based":[206],"detectors.":[208]},"counts_by_year":[],"updated_date":"2025-12-06T23:14:57.273132","created_date":"2025-12-06T00:00:00"}
