{"id":"https://openalex.org/W2037758579","doi":"https://doi.org/10.1145/1150402.1150422","title":"Reverse testing","display_name":"Reverse testing","publication_year":2006,"publication_date":"2006-08-20","ids":{"openalex":"https://openalex.org/W2037758579","doi":"https://doi.org/10.1145/1150402.1150422","mag":"2037758579"},"language":"en","primary_location":{"id":"doi:10.1145/1150402.1150422","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1150402.1150422","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 12th ACM SIGKDD international conference on Knowledge discovery and data mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100380588","display_name":"Wei Fan","orcid":"https://orcid.org/0009-0008-1900-7081"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Wei Fan","raw_affiliation_strings":["IBM T. J. Watson Research, Hawthorne, NY"],"affiliations":[{"raw_affiliation_string":"IBM T. J. Watson Research, Hawthorne, NY","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030289182","display_name":"Ian Davidson","orcid":"https://orcid.org/0000-0002-1258-4213"},"institutions":[{"id":"https://openalex.org/I392282","display_name":"University at Albany, State University of New York","ror":"https://ror.org/012zs8222","country_code":"US","type":"education","lineage":["https://openalex.org/I392282"]},{"id":"https://openalex.org/I113508548","display_name":"Albany State University","ror":"https://ror.org/01vme4277","country_code":"US","type":"education","lineage":["https://openalex.org/I113508548"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ian Davidson","raw_affiliation_strings":["University of Albany, State University of New York, Albany, NY"],"affiliations":[{"raw_affiliation_string":"University of Albany, State University of New York, Albany, NY","institution_ids":["https://openalex.org/I392282","https://openalex.org/I113508548"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100380588"],"corresponding_institution_ids":["https://openalex.org/I1341412227"],"apc_list":null,"apc_paid":null,"fwci":2.7912,"has_fulltext":false,"cited_by_count":38,"citation_normalized_percentile":{"value":0.90722662,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11871","display_name":"Advanced Statistical Methods and Models","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.684921145439148},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5894618034362793},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5648013949394226},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.5488945245742798},{"id":"https://openalex.org/keywords/cross-validation","display_name":"Cross-validation","score":0.49616679549217224},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4907156229019165},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.48199573159217834},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.480352520942688},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4747091829776764},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.19006574153900146}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.684921145439148},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5894618034362793},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5648013949394226},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.5488945245742798},{"id":"https://openalex.org/C27181475","wikidata":"https://www.wikidata.org/wiki/Q541014","display_name":"Cross-validation","level":2,"score":0.49616679549217224},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4907156229019165},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.48199573159217834},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.480352520942688},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4747091829776764},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.19006574153900146},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1150402.1150422","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1150402.1150422","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 12th ACM SIGKDD international conference on Knowledge discovery and data mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W740415","https://openalex.org/W1591673624","https://openalex.org/W1977245551","https://openalex.org/W2032536435","https://openalex.org/W2044758663","https://openalex.org/W2059575958","https://openalex.org/W2094062207","https://openalex.org/W2129851978","https://openalex.org/W2139122730","https://openalex.org/W2144996578","https://openalex.org/W2156909104","https://openalex.org/W2480680997","https://openalex.org/W2595697910","https://openalex.org/W6738852829"],"related_works":["https://openalex.org/W1630076647","https://openalex.org/W2371138613","https://openalex.org/W2080152487","https://openalex.org/W2048963458","https://openalex.org/W43109613","https://openalex.org/W2359952343","https://openalex.org/W2922249299","https://openalex.org/W2239445980","https://openalex.org/W2120455979","https://openalex.org/W1992324151"],"abstract_inverted_index":{"One":[0],"of":[1,47,90,106,123,144,151,218],"the":[2,13,21,25,31,34,69,74,102,134,148,152,173,202,219],"most":[3,135,174],"important":[4],"assumptions":[5],"made":[6],"by":[7],"many":[8,45,187],"classification":[9,107,125],"algorithms":[10],"is":[11,67,72,81,162,177],"that":[12,30,160,195],"training":[14,80,213],"and":[15,33,93,116],"test":[16,207],"sets":[17,37],"are":[18,38],"drawn":[19],"from":[20,40],"same":[22],"distribution,":[23],"i.e.,":[24],"so-called":[26],"\"stationary":[27],"distribution":[28],"assumption\"":[29],"future":[32,138],"past":[35],"data":[36,180],"identical":[39],"a":[41,88,142,210,216],"probabilistic":[42],"standpoint.":[43],"In":[44,95],"domains":[46],"real-world":[48,188],"applications,":[49],"such":[50,109,192],"as":[51,110],"marketing":[52],"solicitation,":[53],"fraud":[54],"detection,":[55],"drug":[56],"testing,":[57],"loan":[58],"approval,":[59],"sub-population":[60],"surveys,":[61],"school":[62],"enrollment":[63],"among":[64,141],"others,":[65],"this":[66],"rarely":[68],"case.":[70],"This":[71],"because":[73],"only":[75],"labeled":[76],"sample":[77,183],"available":[78],"for":[79,137,179,186],"biased":[82,130,212],"in":[83,215],"different":[84],"ways":[85],"due":[86],"to":[87,100,171,222],"variety":[89],"practical":[91],"reasons":[92],"limitations.":[94],"these":[96],"circumstances,":[97],"traditional":[98],"methods":[99],"evaluate":[101],"expected":[103],"generalization":[104],"error":[105],"algorithms,":[108],"structural":[111],"risk":[112],"minimization,":[113],"ten-fold":[114],"cross-validation,":[115],"leave-one-out":[117],"validation,":[118],"usually":[119],"return":[120],"poor":[121,159],"estimates":[122],"which":[124,198],"algorithm,":[126],"when":[127],"trained":[128],"on":[129,204],"dataset,":[131,140],"will":[132,200],"be":[133,157],"accurate":[136,175],"unbiased":[139,206],"number":[143],"competing":[145],"candidates.":[146],"Sometimes,":[147],"estimated":[149],"order":[150],"learning":[153],"algorithms'":[154],"accuracy":[155],"could":[156],"so":[158],"it":[161],"not":[163],"even":[164],"better":[165],"than":[166],"random":[167],"guessing.":[168],"Therefore,a":[169],"method":[170],"determine":[172,197],"learner":[176,199],"needed":[178],"mining":[181],"under":[182],"selection":[184],"bias":[185],"applications.":[189],"We":[190],"present":[191],"an":[193,205],"approach":[194],"can":[196],"perform":[201],"best":[203],"set,":[208,214],"given":[209],"possibly":[211],"fraction":[217],"computational":[220],"cost":[221],"use":[223],"cross-validation":[224],"based":[225],"approaches.":[226]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2016-06-24T00:00:00"}
