{"id":"https://openalex.org/W7118816710","doi":"https://doi.org/10.48550/arxiv.2601.02432","title":"Quantifying Quanvolutional Neural Networks Robustness for Speech in Healthcare Applications","display_name":"Quantifying Quanvolutional Neural Networks Robustness for Speech in Healthcare Applications","publication_year":2026,"publication_date":"2026-01-05","ids":{"openalex":"https://openalex.org/W7118816710","doi":"https://doi.org/10.48550/arxiv.2601.02432"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.02432","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.02432","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.02432","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122158357","display_name":"Ha Tran","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Tran, Ha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122069757","display_name":"Bipasha Kashyap","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kashyap, Bipasha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5037113249","display_name":"Pubudu N. Pathirana","orcid":"https://orcid.org/0000-0001-8014-7798"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pathirana, Pubudu N.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5122158357"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.179299995303154,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.179299995303154,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.12309999763965607,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11804","display_name":"Quantum many-body systems","score":0.07410000264644623,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.8585000038146973},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5979999899864197},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4697999954223633},{"id":"https://openalex.org/keywords/gaussian-noise","display_name":"Gaussian noise","score":0.4575999975204468},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.39649999141693115},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36340001225471497}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.8585000038146973},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6995000243186951},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5979999899864197},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4697999954223633},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4587000012397766},{"id":"https://openalex.org/C4199805","wikidata":"https://www.wikidata.org/wiki/Q2725903","display_name":"Gaussian noise","level":2,"score":0.4575999975204468},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45730000734329224},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40700000524520874},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.39649999141693115},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36340001225471497},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.36090001463890076},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.35839998722076416},{"id":"https://openalex.org/C29265498","wikidata":"https://www.wikidata.org/wiki/Q7047719","display_name":"Noise measurement","level":3,"score":0.3138999938964844},{"id":"https://openalex.org/C21200559","wikidata":"https://www.wikidata.org/wiki/Q7451068","display_name":"Sensitivity (control systems)","level":2,"score":0.29670000076293945},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.26269999146461487},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.25929999351501465}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.02432","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.02432","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.02432","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.02432","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.8188708424568176,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Speech-based":[0],"machine":[1,26],"learning":[2,27],"systems":[3],"are":[4],"sensitive":[5],"to":[6,72,116,130,174,184,221],"noise,":[7,44],"complicating":[8],"reliable":[9],"deployment":[10],"in":[11,52],"emotion":[12],"recognition":[13],"and":[14,49,60,79,83,90,112,144,169,177],"voice":[15],"pathology":[16],"detection.":[17],"We":[18],"evaluate":[19],"the":[20,105,125,138,189],"robustness":[21,141,201],"of":[22,199],"a":[23,53,73,196,225],"hybrid":[24],"quantum":[25,134,213],"model,":[28],"quanvolutional":[29],"neural":[30,36],"networks":[31,37],"(QNNs)":[32],"against":[33],"classical":[34],"convolutional":[35],"(CNNs)":[38],"under":[39,107,157,163,204],"four":[40],"acoustic":[41,207],"corruptions":[42],"(Gaussian":[43],"pitch":[45,108],"shift,":[46,48,109,111],"temporal":[47,110,122],"speed":[50,113,178],"variation)":[51],"clean-train/corrupted-test":[54],"regime.":[55],"Using":[56],"AVFAD":[57],"(voice":[58],"pathology)":[59],"TESS":[61],"(speech":[62],"emotion),":[63],"we":[64],"compare":[65],"three":[66],"QNN":[67,200],"models":[68],"(Random,":[69],"Basic,":[70],"Strongly)":[71],"simple":[74],"CNN":[75],"baseline":[76],"(CNN-Base),":[77],"ResNet-18":[78],"VGG-16":[80],"using":[81],"accuracy":[82,156],"corruption":[84],"metrics":[85],"(CE,":[86],"mCE,":[87],"RCE,":[88],"RmCE),":[89],"analyze":[91],"architectural":[92],"factors":[93],"(circuit":[94],"complexity":[95],"or":[96],"depth,":[97],"convergence)":[98],"alongside":[99],"per-emotion":[100],"robustness.":[101],"QNNs":[102,180],"generally":[103],"outperform":[104],"CNN-Base":[106,126],"variation":[114],"(up":[115],"22%":[117],"lower":[118],"CE/RCE":[119],"at":[120],"severe":[121,158],"shift),":[123],"while":[124,219],"remains":[127,224],"more":[128],"resilient":[129],"Gaussian":[131,165],"noise.":[132],"Among":[133],"circuits,":[135],"QNN-Basic":[136],"achieves":[137],"best":[139],"overall":[140],"on":[142,148],"AVFAD,":[143],"QNN-Random":[145],"performs":[146],"strongest":[147],"TESS.":[149],"Emotion-wise,":[150],"fear":[151],"is":[152,171,195],"most":[153,172],"robust":[154],"(80-90%":[155],"corruptions),":[159],"neutral":[160],"can":[161,215],"collapse":[162],"strong":[164],"noise":[166,217,223],"(5.5%":[167],"accuracy),":[168],"happy":[170],"vulnerable":[173],"pitch,":[175],"temporal,":[176],"distortions.":[179],"also":[181],"converge":[182],"up":[183],"six":[185],"times":[186],"faster":[187],"than":[188],"CNN-Base.":[190],"To":[191],"our":[192],"knowledge,":[193],"this":[194],"systematic":[197],"study":[198],"for":[202],"speech":[203],"common":[205],"non-adversarial":[206],"corruptions,":[208],"indicating":[209],"that":[210],"shallow":[211],"entangling":[212],"front-ends":[214],"improve":[216],"resilience":[218],"sensitivity":[220],"additive":[222],"challenge.":[226]},"counts_by_year":[],"updated_date":"2026-01-08T20:10:11.968330","created_date":"2026-01-08T00:00:00"}
