{"id":"https://openalex.org/W4410812226","doi":"https://doi.org/10.1007/s10618-025-01107-5","title":"Data-driven learning optimal K values for K-nearest neighbour matching in causal inference","display_name":"Data-driven learning optimal K values for K-nearest neighbour matching in causal inference","publication_year":2025,"publication_date":"2025-05-28","ids":{"openalex":"https://openalex.org/W4410812226","doi":"https://doi.org/10.1007/s10618-025-01107-5"},"language":"en","primary_location":{"id":"doi:10.1007/s10618-025-01107-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10618-025-01107-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10618-025-01107-5.pdf","source":{"id":"https://openalex.org/S121920818","display_name":"Data Mining and Knowledge Discovery","issn_l":"1384-5810","issn":["1384-5810","1573-756X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Mining and Knowledge Discovery","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10618-025-01107-5.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101638514","display_name":"Yinghao Zhang","orcid":"https://orcid.org/0009-0007-5165-4898"},"institutions":[{"id":"https://openalex.org/I204823248","display_name":"Huazhong Agricultural University","ror":"https://ror.org/023b72294","country_code":"CN","type":"education","lineage":["https://openalex.org/I204823248"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yinghao Zhang","raw_affiliation_strings":["College of Informatics, Huazhong Agricultural University, Wuhan, 430070, Hubei, China"],"affiliations":[{"raw_affiliation_string":"College of Informatics, Huazhong Agricultural University, Wuhan, 430070, Hubei, China","institution_ids":["https://openalex.org/I204823248"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101887212","display_name":"Tingting Xu","orcid":"https://orcid.org/0000-0002-4399-7379"},"institutions":[{"id":"https://openalex.org/I204823248","display_name":"Huazhong Agricultural University","ror":"https://ror.org/023b72294","country_code":"CN","type":"education","lineage":["https://openalex.org/I204823248"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tingting Xu","raw_affiliation_strings":["College of Informatics, Huazhong Agricultural University, Wuhan, 430070, Hubei, China"],"affiliations":[{"raw_affiliation_string":"College of Informatics, Huazhong Agricultural University, Wuhan, 430070, Hubei, China","institution_ids":["https://openalex.org/I204823248"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065281913","display_name":"Debo Cheng","orcid":"https://orcid.org/0000-0002-0383-1462"},"institutions":[{"id":"https://openalex.org/I170239107","display_name":"University of South Australia","ror":"https://ror.org/01p93h210","country_code":"AU","type":"education","lineage":["https://openalex.org/I170239107"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Debo Cheng","raw_affiliation_strings":["UniSA STEM, University of South Australia, Adelaide, SA, 5095, Australia"],"affiliations":[{"raw_affiliation_string":"UniSA STEM, University of South Australia, Adelaide, SA, 5095, Australia","institution_ids":["https://openalex.org/I170239107"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012177739","display_name":"Jiuyong Li","orcid":"https://orcid.org/0000-0002-9023-1878"},"institutions":[{"id":"https://openalex.org/I170239107","display_name":"University of South Australia","ror":"https://ror.org/01p93h210","country_code":"AU","type":"education","lineage":["https://openalex.org/I170239107"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Jiuyong Li","raw_affiliation_strings":["UniSA STEM, University of South Australia, Adelaide, SA, 5095, Australia"],"affiliations":[{"raw_affiliation_string":"UniSA STEM, University of South Australia, Adelaide, SA, 5095, Australia","institution_ids":["https://openalex.org/I170239107"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100383312","display_name":"Lin Liu","orcid":"https://orcid.org/0000-0002-7202-3418"},"institutions":[{"id":"https://openalex.org/I170239107","display_name":"University of South Australia","ror":"https://ror.org/01p93h210","country_code":"AU","type":"education","lineage":["https://openalex.org/I170239107"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Lin Liu","raw_affiliation_strings":["UniSA STEM, University of South Australia, Adelaide, SA, 5095, Australia"],"affiliations":[{"raw_affiliation_string":"UniSA STEM, University of South Australia, Adelaide, SA, 5095, Australia","institution_ids":["https://openalex.org/I170239107"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100743349","display_name":"Ziqi Xu","orcid":"https://orcid.org/0000-0003-1748-5801"},"institutions":[{"id":"https://openalex.org/I82951845","display_name":"RMIT University","ror":"https://ror.org/04ttjf776","country_code":"AU","type":"education","lineage":["https://openalex.org/I82951845"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Ziqi Xu","raw_affiliation_strings":["School of Computing Technologies, RMIT University, Melbourne, VIC, 3000, Australia"],"affiliations":[{"raw_affiliation_string":"School of Computing Technologies, RMIT University, Melbourne, VIC, 3000, Australia","institution_ids":["https://openalex.org/I82951845"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049033206","display_name":"Zaiwen Feng","orcid":"https://orcid.org/0000-0003-1618-3553"},"institutions":[{"id":"https://openalex.org/I204823248","display_name":"Huazhong Agricultural University","ror":"https://ror.org/023b72294","country_code":"CN","type":"education","lineage":["https://openalex.org/I204823248"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zaiwen Feng","raw_affiliation_strings":["College of Informatics, Huazhong Agricultural University, Wuhan, 430070, Hubei, China"],"affiliations":[{"raw_affiliation_string":"College of Informatics, Huazhong Agricultural University, Wuhan, 430070, Hubei, China","institution_ids":["https://openalex.org/I204823248"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5065281913"],"corresponding_institution_ids":["https://openalex.org/I170239107"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":2.4915,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.8799287,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"39","issue":"4","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10845","display_name":"Advanced Causal Inference Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10845","display_name":"Advanced Causal Inference Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.9858999848365784,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/causal-inference","display_name":"Causal inference","score":0.6402007937431335},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5266002416610718},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5232164859771729},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.522839367389679},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5085529088973999},{"id":"https://openalex.org/keywords/synthetic-data","display_name":"Synthetic data","score":0.4516337811946869},{"id":"https://openalex.org/keywords/propensity-score-matching","display_name":"Propensity score matching","score":0.43039563298225403},{"id":"https://openalex.org/keywords/covariate","display_name":"Covariate","score":0.4267899990081787},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4149743318557739},{"id":"https://openalex.org/keywords/observational-study","display_name":"Observational study","score":0.4142933487892151},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.40777990221977234},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.36189666390419006},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3427433967590332},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3384314775466919}],"concepts":[{"id":"https://openalex.org/C158600405","wikidata":"https://www.wikidata.org/wiki/Q5054566","display_name":"Causal inference","level":2,"score":0.6402007937431335},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5266002416610718},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5232164859771729},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.522839367389679},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5085529088973999},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.4516337811946869},{"id":"https://openalex.org/C17923572","wikidata":"https://www.wikidata.org/wiki/Q7250160","display_name":"Propensity score matching","level":2,"score":0.43039563298225403},{"id":"https://openalex.org/C119043178","wikidata":"https://www.wikidata.org/wiki/Q320723","display_name":"Covariate","level":2,"score":0.4267899990081787},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4149743318557739},{"id":"https://openalex.org/C23131810","wikidata":"https://www.wikidata.org/wiki/Q818574","display_name":"Observational study","level":2,"score":0.4142933487892151},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.40777990221977234},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.36189666390419006},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3427433967590332},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3384314775466919}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10618-025-01107-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10618-025-01107-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10618-025-01107-5.pdf","source":{"id":"https://openalex.org/S121920818","display_name":"Data Mining and Knowledge Discovery","issn_l":"1384-5810","issn":["1384-5810","1573-756X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Mining and Knowledge Discovery","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s10618-025-01107-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10618-025-01107-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10618-025-01107-5.pdf","source":{"id":"https://openalex.org/S121920818","display_name":"Data Mining and Knowledge Discovery","issn_l":"1384-5810","issn":["1384-5810","1573-756X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Data Mining and Knowledge Discovery","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G34411200","display_name":null,"funder_award_id":"DP230101122","funder_id":"https://openalex.org/F4320334704","funder_display_name":"Australian Research Council"}],"funders":[{"id":"https://openalex.org/F4320320979","display_name":"University of South Australia","ror":"https://ror.org/01p93h210"},{"id":"https://openalex.org/F4320334704","display_name":"Australian Research Council","ror":"https://ror.org/05mmh0f86"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4410812226.pdf","grobid_xml":"https://content.openalex.org/works/W4410812226.grobid-xml"},"referenced_works_count":34,"referenced_works":["https://openalex.org/W1967969088","https://openalex.org/W2030614017","https://openalex.org/W2049910836","https://openalex.org/W2055759517","https://openalex.org/W2059484129","https://openalex.org/W2064903582","https://openalex.org/W2069959554","https://openalex.org/W2124541940","https://openalex.org/W2132324013","https://openalex.org/W2132917208","https://openalex.org/W2135957123","https://openalex.org/W2136484149","https://openalex.org/W2148385623","https://openalex.org/W2150291618","https://openalex.org/W2155163959","https://openalex.org/W2208550830","https://openalex.org/W2286582633","https://openalex.org/W2335437633","https://openalex.org/W2515189678","https://openalex.org/W2762488802","https://openalex.org/W2792296590","https://openalex.org/W2794031572","https://openalex.org/W2962727190","https://openalex.org/W3086776987","https://openalex.org/W3090469996","https://openalex.org/W3124999902","https://openalex.org/W3125459412","https://openalex.org/W3150893739","https://openalex.org/W4234961057","https://openalex.org/W4241916448","https://openalex.org/W4378419993","https://openalex.org/W4387850600","https://openalex.org/W4389386407","https://openalex.org/W6603717528"],"related_works":["https://openalex.org/W2464681697","https://openalex.org/W2575790444","https://openalex.org/W2947954788","https://openalex.org/W4296363906","https://openalex.org/W4322505266","https://openalex.org/W4281756720","https://openalex.org/W4385077270","https://openalex.org/W2541915084","https://openalex.org/W4225280467","https://openalex.org/W304115605"],"abstract_inverted_index":{"Abstract":[0],"Within":[1],"the":[2,85,124,149],"realm":[3],"of":[4,88],"causal":[5,11,66,170],"inference,":[6],"a":[7,40,62,79,97,110],"pivotal":[8],"task":[9],"involves":[10],"effect":[12,67],"estimation":[13,68],"from":[14,145,172],"observational":[15,173],"data":[16,174],"when":[17],"there":[18],"exist":[19],"confounding":[20,33,142],"variables.":[21],"The":[22,75],"K-Nearest":[23,71],"Neighbour":[24,72],"Matching":[25,73],"(K-NNM)":[26],"method":[27,64,77],"is":[28],"widely":[29],"applied":[30],"to":[31,50,83,113,139],"handle":[32],"bias,":[34],"but":[35],"its":[36],"general":[37],"application":[38],"sets":[39],"uniform":[41],"K":[42,89],"value":[43,87],"for":[44,65,90,101,128],"all":[45,102],"samples,":[46],"which":[47],"can":[48],"lead":[49],"suboptimal":[51],"results":[52],"in":[53,168],"practice.":[54],"To":[55],"overcome":[56],"this":[57,59],"limitation,":[58],"paper":[60],"introduces":[61],"novel":[63],"called":[69],"Dynamic":[70],"(DK-NNM).":[74],"DK-NNM":[76,95,132,164],"employs":[78],"data-driven":[80],"learning":[81,109],"strategy":[82],"determine":[84],"optimal":[86],"each":[91,129],"sample.":[92,130],"In":[93],"practice,":[94],"reconstructs":[96],"sparse":[98,105],"coefficient":[99],"matrix":[100,112],"samples":[103],"using":[104],"learning,":[106],"while":[107],"simultaneously":[108],"graph":[111],"preserve":[114],"local":[115],"information":[116],"and":[117,136,158,175],"sample":[118],"similarity.":[119],"This":[120],"approach":[121],"helps":[122],"identify":[123],"most":[125],"suitable":[126],"K-value":[127],"Additionally,":[131],"utilizes":[133],"joint":[134],"propensity":[135],"prognostic":[137],"scores":[138],"effectively":[140],"mitigate":[141],"bias":[143],"arising":[144],"high-dimensional":[146],"covariates":[147],"during":[148],"K-NNM":[150],"process.":[151],"Experiments":[152],"performed":[153],"on":[154],"various":[155],"synthetic,":[156],"semi-synthetic,":[157],"real-world":[159],"datasets":[160],"conclusively":[161],"demonstrate":[162],"that":[163],"surpasses":[165],"baseline":[166],"models":[167],"estimating":[169],"effects":[171],"provides":[176],"significant":[177],"improvements":[178],"over":[179],"traditional":[180],"methods.":[181]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
