{"id":"https://openalex.org/W4413075732","doi":"https://doi.org/10.1186/s40537-025-01217-3","title":"Enhancing fraud detection in imbalanced motor insurance datasets using CP-SMOTE and Random Under-Sampling","display_name":"Enhancing fraud detection in imbalanced motor insurance datasets using CP-SMOTE and Random Under-Sampling","publication_year":2025,"publication_date":"2025-07-17","ids":{"openalex":"https://openalex.org/W4413075732","doi":"https://doi.org/10.1186/s40537-025-01217-3"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-025-01217-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-025-01217-3","pdf_url":"https://link.springer.com/content/pdf/10.1186/s40537-025-01217-3.pdf","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://link.springer.com/content/pdf/10.1186/s40537-025-01217-3.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5119257310","display_name":"Pornpawee Komsrimorakot","orcid":null},"institutions":[{"id":"https://openalex.org/I159665162","display_name":"National Institute of Development Administration","ror":"https://ror.org/010g30191","country_code":"TH","type":"education","lineage":["https://openalex.org/I159665162"]}],"countries":["TH"],"is_corresponding":true,"raw_author_name":"Pornpawee Komsrimorakot","raw_affiliation_strings":["Graduate School of Applied Statistics, National Institute of Development Administration, 148 SeriThai Road, Klong-Chan, Bangkapi, Bangkok, 10240, Thailand"],"affiliations":[{"raw_affiliation_string":"Graduate School of Applied Statistics, National Institute of Development Administration, 148 SeriThai Road, Klong-Chan, Bangkapi, Bangkok, 10240, Thailand","institution_ids":["https://openalex.org/I159665162"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014498955","display_name":"Thitirat Siriborvornratanakul","orcid":"https://orcid.org/0000-0002-6530-5302"},"institutions":[{"id":"https://openalex.org/I159665162","display_name":"National Institute of Development Administration","ror":"https://ror.org/010g30191","country_code":"TH","type":"education","lineage":["https://openalex.org/I159665162"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Thitirat Siriborvornratanakul","raw_affiliation_strings":["Graduate School of Applied Statistics, National Institute of Development Administration, 148 SeriThai Road, Klong-Chan, Bangkapi, Bangkok, 10240, Thailand"],"affiliations":[{"raw_affiliation_string":"Graduate School of Applied Statistics, National Institute of Development Administration, 148 SeriThai Road, Klong-Chan, Bangkapi, Bangkok, 10240, Thailand","institution_ids":["https://openalex.org/I159665162"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5119257310"],"corresponding_institution_ids":["https://openalex.org/I159665162"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":15.6742,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.98799917,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"12","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13429","display_name":"Electricity Theft Detection Techniques","score":0.9858999848365784,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9782999753952026,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7659968137741089},{"id":"https://openalex.org/keywords/insurance-fraud","display_name":"Insurance fraud","score":0.7297030091285706},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.5436834692955017},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.4976406395435333},{"id":"https://openalex.org/keywords/computational-science-and-engineering","display_name":"Computational Science and Engineering","score":0.4360889196395874},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.41850265860557556},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.396803617477417},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3797743320465088},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3324270248413086},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.09884494543075562},{"id":"https://openalex.org/keywords/actuarial-science","display_name":"Actuarial science","score":0.09547066688537598},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.08955934643745422}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7659968137741089},{"id":"https://openalex.org/C2778976927","wikidata":"https://www.wikidata.org/wiki/Q838081","display_name":"Insurance fraud","level":2,"score":0.7297030091285706},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.5436834692955017},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.4976406395435333},{"id":"https://openalex.org/C68597687","wikidata":"https://www.wikidata.org/wiki/Q362601","display_name":"Computational Science and Engineering","level":2,"score":0.4360889196395874},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.41850265860557556},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.396803617477417},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3797743320465088},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3324270248413086},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.09884494543075562},{"id":"https://openalex.org/C162118730","wikidata":"https://www.wikidata.org/wiki/Q1128453","display_name":"Actuarial science","level":1,"score":0.09547066688537598},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.08955934643745422},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s40537-025-01217-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-025-01217-3","pdf_url":"https://link.springer.com/content/pdf/10.1186/s40537-025-01217-3.pdf","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:557550b969a142caba1d3746b08c90ac","is_oa":true,"landing_page_url":"https://doaj.org/article/557550b969a142caba1d3746b08c90ac","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Big Data, Vol 12, Iss 1, Pp 1-22 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s40537-025-01217-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-025-01217-3","pdf_url":"https://link.springer.com/content/pdf/10.1186/s40537-025-01217-3.pdf","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.4399999976158142,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4413075732.pdf","grobid_xml":"https://content.openalex.org/works/W4413075732.grobid-xml"},"referenced_works_count":32,"referenced_works":["https://openalex.org/W1993220166","https://openalex.org/W2104933073","https://openalex.org/W2148143831","https://openalex.org/W2296337638","https://openalex.org/W2333568743","https://openalex.org/W2751515787","https://openalex.org/W2892493782","https://openalex.org/W2904542630","https://openalex.org/W2908465383","https://openalex.org/W2985407284","https://openalex.org/W3035922394","https://openalex.org/W3040219594","https://openalex.org/W3080526713","https://openalex.org/W3091924507","https://openalex.org/W3186655196","https://openalex.org/W4205815544","https://openalex.org/W4221074700","https://openalex.org/W4283018934","https://openalex.org/W4286433211","https://openalex.org/W4316021877","https://openalex.org/W4323051174","https://openalex.org/W4387745472","https://openalex.org/W4388011682","https://openalex.org/W4388996683","https://openalex.org/W4389037881","https://openalex.org/W4390284838","https://openalex.org/W4391554661","https://openalex.org/W4395673980","https://openalex.org/W4400431367","https://openalex.org/W4400599071","https://openalex.org/W4406614817","https://openalex.org/W4406832705"],"related_works":["https://openalex.org/W3193043704","https://openalex.org/W4386259002","https://openalex.org/W1546989560","https://openalex.org/W3171520305","https://openalex.org/W1924178503","https://openalex.org/W3135126032","https://openalex.org/W2361887085","https://openalex.org/W4308716060","https://openalex.org/W4280648719","https://openalex.org/W4394984040"],"abstract_inverted_index":{"Detecting":[0],"fraudulent":[1,17,99],"claims":[2],"in":[3,173],"motor":[4,75],"insurance":[5,76,175],"remains":[6],"a":[7,25,44,121,124,132],"critical":[8,152],"challenge":[9],"due":[10],"to":[11,58],"the":[12,90,108,111,128,139,151],"severe":[13],"class":[14,61,155],"imbalance":[15,81],"between":[16],"and":[18,33,83,107,157,163],"legitimate":[19],"cases.":[20],"This":[21,136],"study":[22,137],"systematically":[23],"evaluates":[24],"diverse":[26],"set":[27],"of":[28,105,134,141,154],"resampling":[29],"strategies\u2014including":[30],"oversampling,":[31],"under-sampling,":[32],"hybrid":[34,46],"methods\u2014in":[35],"combination":[36,94],"with":[37,54,123],"multiple":[38,146],"machine":[39],"learning":[40],"classifiers.":[41],"We":[42],"propose":[43],"novel":[45],"technique":[47],"that":[48,89],"integrates":[49],"Center":[50],"Point":[51],"SMOTE":[52],"(CP-SMOTE)":[53],"Random":[55],"Under-Sampling":[56],"(RUS)":[57],"effectively":[59],"address":[60],"imbalance.":[62],"To":[63],"evaluate":[64],"its":[65],"generalizability,":[66],"this":[67],"approach":[68],"was":[69],"applied":[70],"across":[71,115,145],"three":[72],"publicly":[73],"available":[74],"datasets,":[77],"each":[78],"exhibiting":[79],"distinct":[80],"ratios":[82],"feature":[84,158],"complexities.":[85],"Experimental":[86],"results":[87],"demonstrate":[88],"CP-SMOTE":[91,142],"+":[92,143],"RUS":[93,144],"consistently":[95],"enhances":[96],"recall":[97,133],"for":[98,167],"cases":[100],"while":[101],"maintaining":[102],"acceptable":[103],"levels":[104],"precision":[106],"area":[109],"under":[110],"precision-recall":[112],"curve":[113],"(AUC-PR)":[114],"different":[116],"model":[117,161],"configurations.":[118],"Notably,":[119],"on":[120,160],"dataset":[122],"1:16":[125],"fraud-to-non-fraud":[126],"ratio,":[127],"polynomial-kernel":[129],"SVM":[130],"achieved":[131],"94.03%.":[135],"validates":[138],"robustness":[140],"datasets.":[147],"The":[148],"findings":[149],"underscore":[150],"impact":[153],"distribution":[156],"dimensionality":[159],"performance":[162],"offer":[164],"actionable":[165],"insights":[166],"deploying":[168],"high-recall":[169],"fraud":[170],"detection":[171],"systems":[172],"real-world":[174],"applications.":[176]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
