{"id":"https://openalex.org/W4375868819","doi":"https://doi.org/10.1109/icassp49357.2023.10097121","title":"Selinet: A Lightweight Model for Single Channel Speech Separation","display_name":"Selinet: A Lightweight Model for Single Channel Speech Separation","publication_year":2023,"publication_date":"2023-05-05","ids":{"openalex":"https://openalex.org/W4375868819","doi":"https://doi.org/10.1109/icassp49357.2023.10097121"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49357.2023.10097121","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10097121","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056726536","display_name":"Ha Minh Tan","orcid":null},"institutions":[{"id":"https://openalex.org/I22265921","display_name":"National Central University","ror":"https://ror.org/00944ve71","country_code":"TW","type":"education","lineage":["https://openalex.org/I22265921"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Ha Minh Tan","raw_affiliation_strings":["National Central University,Dept. of Computer Science and Information Engineering,Taiwan","Dept. of Computer Science and Information Engineering, National Central University, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Central University,Dept. of Computer Science and Information Engineering,Taiwan","institution_ids":["https://openalex.org/I22265921"]},{"raw_affiliation_string":"Dept. of Computer Science and Information Engineering, National Central University, Taiwan","institution_ids":["https://openalex.org/I22265921"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001193118","display_name":"Duc-Quang Vu","orcid":"https://orcid.org/0000-0001-5458-3713"},"institutions":[{"id":"https://openalex.org/I4387154701","display_name":"Thai Nguyen University Of Education","ror":"https://ror.org/044deqz63","country_code":null,"type":"education","lineage":["https://openalex.org/I4387154701"]},{"id":"https://openalex.org/I4210115718","display_name":"Thai Nguyen University","ror":"https://ror.org/02128gy91","country_code":"VN","type":"education","lineage":["https://openalex.org/I4210115718"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Duc-Quang Vu","raw_affiliation_strings":["Thai Nguyen University of Education,Thai Nguyen,Vietnam","Thai Nguyen University of Education, Thai Nguyen, Vietnam"],"affiliations":[{"raw_affiliation_string":"Thai Nguyen University of Education,Thai Nguyen,Vietnam","institution_ids":["https://openalex.org/I4210115718"]},{"raw_affiliation_string":"Thai Nguyen University of Education, Thai Nguyen, Vietnam","institution_ids":["https://openalex.org/I4210115718","https://openalex.org/I4387154701"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029325015","display_name":"Jia\u2010Ching Wang","orcid":"https://orcid.org/0000-0003-0024-6732"},"institutions":[{"id":"https://openalex.org/I22265921","display_name":"National Central University","ror":"https://ror.org/00944ve71","country_code":"TW","type":"education","lineage":["https://openalex.org/I22265921"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Jia-Ching Wang","raw_affiliation_strings":["National Central University,Dept. of Computer Science and Information Engineering,Taiwan","Dept. of Computer Science and Information Engineering, National Central University, Taiwan"],"affiliations":[{"raw_affiliation_string":"National Central University,Dept. of Computer Science and Information Engineering,Taiwan","institution_ids":["https://openalex.org/I22265921"]},{"raw_affiliation_string":"Dept. of Computer Science and Information Engineering, National Central University, Taiwan","institution_ids":["https://openalex.org/I22265921"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5056726536"],"corresponding_institution_ids":["https://openalex.org/I22265921"],"apc_list":null,"apc_paid":null,"fwci":3.9516,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.94746287,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10326","display_name":"Indoor and Outdoor Localization Technologies","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.8378632068634033},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.8179938793182373},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7331530451774597},{"id":"https://openalex.org/keywords/pyramid","display_name":"Pyramid (geometry)","score":0.6517155766487122},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5952205061912537},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.5602808594703674},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.5386514663696289},{"id":"https://openalex.org/keywords/computational-resource","display_name":"Computational resource","score":0.47687608003616333},{"id":"https://openalex.org/keywords/separation","display_name":"Separation (statistics)","score":0.45004236698150635},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.42126744985580444},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4021972119808197},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.358266681432724},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2719547152519226},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.14839890599250793},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12448424100875854},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.09596827626228333}],"concepts":[{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.8378632068634033},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.8179938793182373},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7331530451774597},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.6517155766487122},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5952205061912537},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.5602808594703674},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.5386514663696289},{"id":"https://openalex.org/C127964446","wikidata":"https://www.wikidata.org/wiki/Q1092142","display_name":"Computational resource","level":3,"score":0.47687608003616333},{"id":"https://openalex.org/C2776061190","wikidata":"https://www.wikidata.org/wiki/Q7451805","display_name":"Separation (statistics)","level":2,"score":0.45004236698150635},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.42126744985580444},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4021972119808197},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.358266681432724},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2719547152519226},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.14839890599250793},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12448424100875854},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.09596827626228333},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49357.2023.10097121","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10097121","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W2104978738","https://openalex.org/W2156876426","https://openalex.org/W2162915993","https://openalex.org/W2221409856","https://openalex.org/W2412782625","https://openalex.org/W2630837129","https://openalex.org/W2734774145","https://openalex.org/W2735663686","https://openalex.org/W2952218014","https://openalex.org/W2962935966","https://openalex.org/W2963163009","https://openalex.org/W2964238697","https://openalex.org/W2964309882","https://openalex.org/W2981436548","https://openalex.org/W2982083293","https://openalex.org/W2990594533","https://openalex.org/W3015199127","https://openalex.org/W3035268204","https://openalex.org/W3042857426","https://openalex.org/W3094607766","https://openalex.org/W3096893582","https://openalex.org/W3099330747","https://openalex.org/W3124972797","https://openalex.org/W3160903688","https://openalex.org/W3163652268","https://openalex.org/W3175785186","https://openalex.org/W4200529817","https://openalex.org/W4206215724","https://openalex.org/W4224931672","https://openalex.org/W4225281800","https://openalex.org/W4283794752","https://openalex.org/W4285197326","https://openalex.org/W4285274345","https://openalex.org/W4297775537","https://openalex.org/W4312575985","https://openalex.org/W4312672045","https://openalex.org/W6631190155","https://openalex.org/W6683161558","https://openalex.org/W6737664043","https://openalex.org/W6739696289","https://openalex.org/W6748481559","https://openalex.org/W6774995033"],"related_works":["https://openalex.org/W1657880117","https://openalex.org/W2595172197","https://openalex.org/W2022849497","https://openalex.org/W2407190427","https://openalex.org/W3081299480","https://openalex.org/W2919210741","https://openalex.org/W2907584218","https://openalex.org/W3002446410","https://openalex.org/W4390224712","https://openalex.org/W4322096758"],"abstract_inverted_index":{"The":[0,46],"time-domain":[1],"speech":[2,42],"separation":[3],"methods":[4],"adopting":[5],"deep":[6],"learning":[7],"have":[8],"obtained":[9],"impressive":[10,116],"performance.":[11],"However,":[12],"the":[13,22,25,49,65,71,78,88,94,121],"computational":[14,75,123],"complexity,":[15],"model":[16,72,126],"size,":[17],"and":[18,57,74,105,125],"performance":[19,117],"are":[20],"still":[21,119],"challenges":[23],"for":[24,41],"implementation":[26],"on":[27],"real-time":[28],"low-resource":[29],"devices.":[30],"In":[31,62],"this":[32],"paper,":[33],"we":[34],"introduce":[35],"a":[36,82],"lightweight":[37],"yet":[38],"effective":[39],"network":[40],"separation,":[43],"namely":[44],"SeliNet.":[45],"SeliNet":[47,113],"is":[48],"one-dimensional":[50],"convolutional":[51],"architecture":[52],"that":[53],"employs":[54],"bottleneck":[55,63],"modules,":[56,64],"atrous":[58,95],"temporal":[59,96],"pyramid":[60,97],"pooling.":[61],"depth-wise":[66],"separable":[67],"convolution":[68],"significantly":[69],"decreases":[70],"size":[73],"cost":[76,124],"meanwhile":[77],"squeeze":[79],"excitation":[80],"uses":[81],"context":[83,107],"vector":[84],"to":[85,114],"interact":[86],"with":[87],"entire":[89],"hidden":[90],"state":[91],"vector.":[92],"Specifically,":[93],"pooling":[98],"recognizes":[99],"long-time":[100],"sequences":[101],"of":[102],"various":[103],"lengths":[104],"extracts":[106],"at":[108],"different":[109],"field-of-views.":[110],"This":[111],"helps":[112],"obtain":[115],"while":[118],"maintaining":[120],"small":[122],"size.":[127]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":11}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
