{"id":"https://openalex.org/W4416250842","doi":"https://doi.org/10.1109/waspaa66052.2025.11231004","title":"Combolutional Neural Networks","display_name":"Combolutional Neural Networks","publication_year":2025,"publication_date":"2025-10-12","ids":{"openalex":"https://openalex.org/W4416250842","doi":"https://doi.org/10.1109/waspaa66052.2025.11231004"},"language":null,"primary_location":{"id":"doi:10.1109/waspaa66052.2025.11231004","is_oa":false,"landing_page_url":"https://doi.org/10.1109/waspaa66052.2025.11231004","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5094040174","display_name":"Cameron Churchwell","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Cameron Churchwell","raw_affiliation_strings":["University of Illinois at Urbana-Champaign,Siebel School of Computing and Data Science,Urbana,IL,USA,61801"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign,Siebel School of Computing and Data Science,Urbana,IL,USA,61801","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064582903","display_name":"Minje Kim","orcid":"https://orcid.org/0000-0003-3513-8328"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Minje Kim","raw_affiliation_strings":["University of Illinois at Urbana-Champaign,Siebel School of Computing and Data Science,Urbana,IL,USA,61801"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign,Siebel School of Computing and Data Science,Urbana,IL,USA,61801","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038903729","display_name":"Paris Smaragdis","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Paris Smaragdis","raw_affiliation_strings":["University of Illinois at Urbana-Champaign,Siebel School of Computing and Data Science,Urbana,IL,USA,61801"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign,Siebel School of Computing and Data Science,Urbana,IL,USA,61801","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5094040174"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.45268462,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.7771999835968018,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.7771999835968018,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.11919999867677689,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.03280000016093254,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.6743000149726868},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.5982000231742859},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5246999859809875},{"id":"https://openalex.org/keywords/envelope","display_name":"Envelope (radar)","score":0.5202000141143799},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.5026999711990356},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.47440001368522644},{"id":"https://openalex.org/keywords/infinite-impulse-response","display_name":"Infinite impulse response","score":0.4553999900817871},{"id":"https://openalex.org/keywords/harmonic","display_name":"Harmonic","score":0.4399999976158142}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7440000176429749},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.6743000149726868},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.5982000231742859},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5246999859809875},{"id":"https://openalex.org/C65155139","wikidata":"https://www.wikidata.org/wiki/Q5380912","display_name":"Envelope (radar)","level":3,"score":0.5202000141143799},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.5026999711990356},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.47440001368522644},{"id":"https://openalex.org/C183816354","wikidata":"https://www.wikidata.org/wiki/Q665617","display_name":"Infinite impulse response","level":4,"score":0.4553999900817871},{"id":"https://openalex.org/C127934551","wikidata":"https://www.wikidata.org/wiki/Q1148098","display_name":"Harmonic","level":2,"score":0.4399999976158142},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43459999561309814},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.392300009727478},{"id":"https://openalex.org/C19247436","wikidata":"https://www.wikidata.org/wiki/Q192727","display_name":"Physical layer","level":3,"score":0.3741999864578247},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3452000021934509},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.3197999894618988},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3158000111579895},{"id":"https://openalex.org/C117468950","wikidata":"https://www.wikidata.org/wiki/Q208074","display_name":"Network layer","level":3,"score":0.3043000102043152},{"id":"https://openalex.org/C124086623","wikidata":"https://www.wikidata.org/wiki/Q5994","display_name":"Piano","level":2,"score":0.30000001192092896},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.2782999873161316},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2590000033378601},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/waspaa66052.2025.11231004","is_oa":false,"landing_page_url":"https://doi.org/10.1109/waspaa66052.2025.11231004","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1498436455","https://openalex.org/W1635512741","https://openalex.org/W2045135321","https://openalex.org/W2064675550","https://openalex.org/W2068470708","https://openalex.org/W2147800946","https://openalex.org/W2519091744","https://openalex.org/W2952218014","https://openalex.org/W2954698171","https://openalex.org/W2964051853","https://openalex.org/W2964052309","https://openalex.org/W3196974791","https://openalex.org/W4293363567","https://openalex.org/W4385245566"],"related_works":[],"abstract_inverted_index":{"Selecting":[0],"appropriate":[1],"inductive":[2],"biases":[3],"is":[4,88,102],"an":[5,89],"essential":[6],"step":[7],"in":[8,50,95],"the":[9,34,51,56,59,85,113],"design":[10],"of":[11,27,58],"machine":[12],"learning":[13],"models,":[14],"especially":[15],"when":[16],"working":[17],"with":[18],"audio,":[19],"where":[20,98],"even":[21],"short":[22],"clips":[23],"may":[24],"contain":[25],"millions":[26],"samples.":[28],"To":[29],"this":[30],"end,":[31],"we":[32],"propose":[33],"combolutional":[35,60,86,114],"layer:":[36],"a":[37],"learned-delay":[38],"IIR":[39],"comb":[40],"filter":[41],"and":[42,76,109,134],"fused":[43],"envelope":[44],"detector,":[45],"which":[46],"extracts":[47],"harmonic":[48,100],"features":[49],"time":[52],"domain.":[53],"We":[54,82],"demonstrate":[55],"efficacy":[57],"layer":[61,87,115],"on":[62],"three":[63],"information":[64],"retrieval":[65],"tasks,":[66],"evaluate":[67],"its":[68],"computational":[69],"cost":[70],"relative":[71],"to":[72],"other":[73,118],"audio":[74,96],"frontends,":[75,123],"provide":[77],"efficient":[78,128],"implementations":[79],"for":[80,92],"training.":[81],"find":[83],"that":[84],"effective":[90],"replacement":[91],"convolutional":[93],"layers":[94],"tasks":[97],"precise":[99],"analysis":[101],"important,":[103],"e.g.,":[104],"piano":[105],"transcription,":[106],"speaker":[107],"classification,":[108],"key":[110,119],"detection.":[111],"Additionally,":[112],"has":[116],"several":[117],"benefits":[120],"over":[121],"existing":[122],"namely:":[124],"low":[125],"parameter":[126],"count,":[127],"CPU":[129],"inference,":[130],"strictly":[131],"real-valued":[132],"computations,":[133],"improved":[135],"interpretability.":[136]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-14T00:00:00"}
