{"id":"https://openalex.org/W7148798616","doi":"https://doi.org/10.48550/arxiv.2604.01330","title":"Evolutionary Multi-Objective Fusion of Deepfake Speech Detectors","display_name":"Evolutionary Multi-Objective Fusion of Deepfake Speech Detectors","publication_year":2026,"publication_date":"2026-04-01","ids":{"openalex":"https://openalex.org/W7148798616","doi":"https://doi.org/10.48550/arxiv.2604.01330"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.01330","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01330","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.01330","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120499181","display_name":"Vojt\u011bch Stan\u011bk","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stan\u011bk, Vojt\u011bch","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132888452","display_name":"Martin Pere\u0161\u00edni","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pere\u0161\u00edni, Martin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055549968","display_name":"Luk\u00e1\u0161 Sekanina","orcid":"https://orcid.org/0000-0002-2693-9011"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sekanina, Luk\u00e1\u0161","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012747080","display_name":"Anton Firc","orcid":"https://orcid.org/0000-0002-4717-1910"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Firc, Anton","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5088145356","display_name":"Kamil Malinka","orcid":"https://orcid.org/0000-0002-9009-2193"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Malinka, Kamil","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.8946999907493591,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.8946999907493591,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.059300001710653305,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.012799999676644802,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.7777000069618225},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6751000285148621},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.46399998664855957},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.46129998564720154},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.4422999918460846},{"id":"https://openalex.org/keywords/pareto-principle","display_name":"Pareto principle","score":0.3935000002384186},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3781999945640564}],"concepts":[{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.7777000069618225},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7335000038146973},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6751000285148621},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4749000072479248},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.46399998664855957},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.46129998564720154},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.4422999918460846},{"id":"https://openalex.org/C137635306","wikidata":"https://www.wikidata.org/wiki/Q182667","display_name":"Pareto principle","level":2,"score":0.3935000002384186},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3781999945640564},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3522000014781952},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.34929999709129333},{"id":"https://openalex.org/C159149176","wikidata":"https://www.wikidata.org/wiki/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.3334999978542328},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.33230000734329224},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.30570000410079956},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.30410000681877136},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.29739999771118164},{"id":"https://openalex.org/C153668964","wikidata":"https://www.wikidata.org/wiki/Q27636","display_name":"Majority rule","level":2,"score":0.29649999737739563},{"id":"https://openalex.org/C105902424","wikidata":"https://www.wikidata.org/wiki/Q1197129","display_name":"Evolutionary computation","level":2,"score":0.28940001130104065},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.26499998569488525},{"id":"https://openalex.org/C45942800","wikidata":"https://www.wikidata.org/wiki/Q245652","display_name":"Ensemble learning","level":2,"score":0.259799987077713}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.01330","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01330","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.01330","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.01330","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"While":[0],"deepfake":[1],"speech":[2],"detectors":[3,83],"built":[4],"on":[5,75],"large":[6],"self-supervised":[7],"learning":[8],"(SSL)":[9],"models":[10],"achieve":[11],"high":[12],"accuracy,":[13],"employing":[14],"standard":[15],"ensemble":[16],"fusion":[17,39],"to":[18],"further":[19],"enhance":[20],"robustness":[21],"often":[22],"results":[23],"in":[24],"oversized":[25],"systems":[26],"with":[27,80],"diminishing":[28],"returns.":[29],"To":[30],"address":[31],"this,":[32],"we":[33],"propose":[34],"an":[35],"evolutionary":[36],"multi-objective":[37],"score":[38,60],"framework":[40],"that":[41,66,85,108,135],"jointly":[42],"minimizes":[43],"detection":[44],"error":[45],"and":[46,62,93,105,138],"system":[47,115],"complexity.":[48],"We":[49],"explore":[50],"two":[51],"encodings":[52],"optimized":[53],"by":[54],"NSGA-II:":[55],"binary-coded":[56],"detector":[57,68],"selection":[58],"for":[59,70],"averaging":[61,92],"a":[63,71,126],"real-valued":[64,98],"scheme":[65],"optimizes":[67],"weights":[69],"weighted":[72],"sum.":[73],"Experiments":[74],"the":[76,86,120],"ASVspoof":[77],"5":[78],"dataset":[79],"36":[81],"SSL-based":[82],"show":[84],"obtained":[87],"Pareto":[88],"fronts":[89],"outperform":[90],"simple":[91],"logistic":[94],"regression":[95],"baselines.":[96],"The":[97],"variant":[99],"achieves":[100],"2.37%":[101],"EER":[102],"(0.0684":[103],"minDCF)":[104],"identifies":[106],"configurations":[107],"match":[109],"state-of-the-art":[110],"performance":[111],"while":[112],"significantly":[113],"reducing":[114],"complexity,":[116],"requiring":[117],"only":[118],"half":[119],"parameters.":[121],"Our":[122],"method":[123],"also":[124],"provides":[125],"diverse":[127],"set":[128],"of":[129],"trade-off":[130],"solutions,":[131],"enabling":[132],"deployment":[133],"choices":[134],"balance":[136],"accuracy":[137],"computational":[139],"cost.":[140]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-04T00:00:00"}
