{"id":"https://openalex.org/W6888038679","doi":"https://doi.org/10.18420/btw2023-16","title":"Approach to Synthetic Data Generation for Imbalanced Multi-class Problems with Heterogeneous Groups","display_name":"Approach to Synthetic Data Generation for Imbalanced Multi-class Problems with Heterogeneous Groups","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W6888038679","doi":"https://doi.org/10.18420/btw2023-16"},"language":"en","primary_location":{"id":"doi:10.18420/btw2023-16","is_oa":true,"landing_page_url":"https://doi.org/10.18420/btw2023-16","pdf_url":null,"source":{"id":"https://openalex.org/S7407052918","display_name":"Gesellschaft f\u00fcr Informatik (GI)","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article-journal"},"type":"article","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.18420/btw2023-16","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Treder-Tschechlov, Dennis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Treder-Tschechlov, Dennis","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Reimann, Peter","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Reimann, Peter","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Schwarz, Holger","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schwarz, Holger","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Mitschang, Bernhard","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mitschang, Bernhard","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.1632,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.61217853,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9549999833106995,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9549999833106995,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11653","display_name":"Financial Distress and Bankruptcy Prediction","score":0.012500000186264515,"subfield":{"id":"https://openalex.org/subfields/1402","display_name":"Accounting"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.003100000089034438,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4887999892234802},{"id":"https://openalex.org/keywords/synthetic-data","display_name":"Synthetic data","score":0.46869999170303345},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4406999945640564},{"id":"https://openalex.org/keywords/data-type","display_name":"Data type","score":0.4235999882221222},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.3422999978065491}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7354999780654907},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.548799991607666},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4887999892234802},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4812999963760376},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.46869999170303345},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4406999945640564},{"id":"https://openalex.org/C138958017","wikidata":"https://www.wikidata.org/wiki/Q190087","display_name":"Data type","level":2,"score":0.4235999882221222},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.397599995136261},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.3422999978065491},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.313400000333786},{"id":"https://openalex.org/C2780724565","wikidata":"https://www.wikidata.org/wiki/Q5227256","display_name":"Data classification","level":2,"score":0.3005000054836273},{"id":"https://openalex.org/C3020493868","wikidata":"https://www.wikidata.org/wiki/Q55631277","display_name":"Real world data","level":2,"score":0.27639999985694885}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18420/btw2023-16","is_oa":true,"landing_page_url":"https://doi.org/10.18420/btw2023-16","pdf_url":null,"source":{"id":"https://openalex.org/S7407052918","display_name":"Gesellschaft f\u00fcr Informatik (GI)","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"doi:10.18420/btw2023-16","is_oa":true,"landing_page_url":"https://doi.org/10.18420/btw2023-16","pdf_url":null,"source":{"id":"https://openalex.org/S7407052918","display_name":"Gesellschaft f\u00fcr Informatik (GI)","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article-journal"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"To":[0],"benchmark":[1],"novel":[2],"classification":[3,30],"algorithms,":[4],"these":[5,42,162,234],"algorithms":[6],"should":[7],"be":[8,69,92],"evaluated":[9],"on":[10,72],"data":[11,22,39,83,96,103,107,133,157,214,218],"with":[12],"characteristics":[13,23,43,67,90,160,219],"that":[14,24,40,85,104,123,134,147,209,215,226],"also":[15],"appear":[16],"in":[17,151,187,203],"real-world":[18,73,149,180],"use":[19,142,181],"cases.":[20,182],"Important":[21],"often":[25],"lead":[26],"to":[27,59,80,101,130,155,170,229],"challenges":[28],"for":[29],"approaches":[31],"are":[32,44,98,192,201],"multi-class":[33,111,220],"imbalance":[34,112,221],"and":[35,113,177,199,222,225],"heterogeneous":[36,114,153,223],"groups.":[37,115,163],"Real-world":[38],"comprise":[41],"usually":[45],"not":[46,99],"publicly":[47],"available,":[48],"e.":[49],"g.,":[50],"because":[51],"they":[52],"constitute":[53],"sensible":[54],"patient":[55],"information":[56],"or":[57],"due":[58],"privacy":[60],"concerns.":[61],"Further,":[62],"the":[63,66,89,159,172,193,217],"manifestations":[64,87,232],"of":[65,88,143,161,174,196,233],"cannot":[68],"controlled":[70],"specifically":[71],"data.":[74],"A":[75],"more":[76],"rigorous":[77],"approach":[78,122,184,211],"is":[79,185],"synthetically":[81,131],"generate":[82,102,132,156,213],"such":[84],"different":[86,188,231],"can":[91,212],"controlled.":[93],"However,":[94],"existing":[95],"generators":[97],"able":[100],"feature":[105,216],"both":[106,136],"characteristics,":[108],"i.":[109],"e.,":[110],"In":[116,138,164],"this":[117,125],"paper,":[118],"we":[119,140,166],"propose":[120],"an":[121],"fills":[124],"gap":[126],"as":[127,190],"it":[128,227],"allows":[129,228],"exhibit":[135],"characteristics.":[137,235],"particular,":[139],"make":[141],"a":[144],"taxonomy":[145],"model":[146],"organizes":[148],"entities":[150],"domain-specific":[152],"groups":[154,178,224],"reflecting":[158],"addition,":[165],"incorporate":[167],"probability":[168],"distributions":[169],"reflect":[171],"imbalances":[173],"multiple":[175],"classes":[176],"from":[179],"Our":[183],"applicable":[186],"domains,":[189],"taxonomies":[191],"simplest":[194],"form":[195],"knowledge":[197],"models":[198],"thus":[200],"available":[202],"many":[204],"domains.":[205],"The":[206],"evaluation":[207],"shows":[208],"our":[210],"control":[230]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
