{"id":"https://openalex.org/W4319663835","doi":"https://doi.org/10.1109/lsp.2023.3243764","title":"Time-Domain Speech Separation Networks With Graph Encoding Auxiliary","display_name":"Time-Domain Speech Separation Networks With Graph Encoding Auxiliary","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4319663835","doi":"https://doi.org/10.1109/lsp.2023.3243764"},"language":"en","primary_location":{"id":"doi:10.1109/lsp.2023.3243764","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2023.3243764","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100447741","display_name":"Tingting Wang","orcid":"https://orcid.org/0000-0002-6726-6458"},"institutions":[{"id":"https://openalex.org/I41198531","display_name":"Nanjing University of Posts and Telecommunications","ror":"https://ror.org/043bpky34","country_code":"CN","type":"education","lineage":["https://openalex.org/I41198531"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Tingting Wang","raw_affiliation_strings":["Department of Communication and Information Engineering, Nanjing University of Posts and Telecommunications, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Department of Communication and Information Engineering, Nanjing University of Posts and Telecommunications, Nanjing, China","institution_ids":["https://openalex.org/I41198531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060530570","display_name":"Zexu Pan","orcid":"https://orcid.org/0000-0002-8106-1176"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Zexu Pan","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071074013","display_name":"Meng Ge","orcid":"https://orcid.org/0000-0003-2017-4529"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meng Ge","raw_affiliation_strings":["Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047980942","display_name":"Zhen Yang","orcid":"https://orcid.org/0000-0002-4400-3823"},"institutions":[{"id":"https://openalex.org/I41198531","display_name":"Nanjing University of Posts and Telecommunications","ror":"https://ror.org/043bpky34","country_code":"CN","type":"education","lineage":["https://openalex.org/I41198531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhen Yang","raw_affiliation_strings":["Department of Communication and Information Engineering, Nanjing University of Posts and Telecommunications, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Department of Communication and Information Engineering, Nanjing University of Posts and Telecommunications, Nanjing, China","institution_ids":["https://openalex.org/I41198531"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5032690182","display_name":"Haizhou Li","orcid":null},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]},{"id":"https://openalex.org/I180437899","display_name":"University of Bremen","ror":"https://ror.org/04ers2y35","country_code":"DE","type":"education","lineage":["https://openalex.org/I180437899"]},{"id":"https://openalex.org/I4210099586","display_name":"Shenzhen Research Institute of Big Data","ror":"https://ror.org/00z1gwf89","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210099586"]},{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN","DE","SG"],"is_corresponding":false,"raw_author_name":"Haizhou Li","raw_affiliation_strings":["Department of Electrical and Computer Engineering, National University of Singapore, Singapore","Kriston AI, Xiamen, China","University of Bremen, Bremen, Germany","Shenzhen Research Institute of Big Data, School of Data Science, The Chinese University of Hong Kong, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]},{"raw_affiliation_string":"Kriston AI, Xiamen, China","institution_ids":[]},{"raw_affiliation_string":"University of Bremen, Bremen, Germany","institution_ids":["https://openalex.org/I180437899"]},{"raw_affiliation_string":"Shenzhen Research Institute of Big Data, School of Data Science, The Chinese University of Hong Kong, Shenzhen, China","institution_ids":["https://openalex.org/I4210116924","https://openalex.org/I4210099586"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100447741"],"corresponding_institution_ids":["https://openalex.org/I41198531"],"apc_list":null,"apc_paid":null,"fwci":3.3755,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.93200273,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"30","issue":null,"first_page":"110","last_page":"114"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7591763734817505},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6638885736465454},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5379311442375183},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.5355072021484375},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5304424166679382},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5217012763023376},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.50113844871521},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.46765774488449097},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46000415086746216},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.45031997561454773},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.4359976649284363},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4207892417907715},{"id":"https://openalex.org/keywords/sliding-window-protocol","display_name":"Sliding window protocol","score":0.4198170602321625},{"id":"https://openalex.org/keywords/window","display_name":"Window (computing)","score":0.16010591387748718},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.13046661019325256}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7591763734817505},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6638885736465454},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5379311442375183},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.5355072021484375},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5304424166679382},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5217012763023376},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.50113844871521},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.46765774488449097},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46000415086746216},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.45031997561454773},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.4359976649284363},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4207892417907715},{"id":"https://openalex.org/C102392041","wikidata":"https://www.wikidata.org/wiki/Q592860","display_name":"Sliding window protocol","level":3,"score":0.4198170602321625},{"id":"https://openalex.org/C2778751112","wikidata":"https://www.wikidata.org/wiki/Q835016","display_name":"Window (computing)","level":2,"score":0.16010591387748718},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.13046661019325256},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lsp.2023.3243764","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2023.3243764","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.47999998927116394,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G2535026932","display_name":null,"funder_award_id":"62071242","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2799040894","display_name":null,"funder_award_id":"62271432","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W2101491865","https://openalex.org/W2125838338","https://openalex.org/W2161763921","https://openalex.org/W2547553232","https://openalex.org/W2550143307","https://openalex.org/W2734774145","https://openalex.org/W2735663686","https://openalex.org/W2792764867","https://openalex.org/W2796431263","https://openalex.org/W2889540509","https://openalex.org/W2891405874","https://openalex.org/W2912317488","https://openalex.org/W2952218014","https://openalex.org/W2962905190","https://openalex.org/W2962935966","https://openalex.org/W2962946486","https://openalex.org/W2963317762","https://openalex.org/W2972541922","https://openalex.org/W2981976899","https://openalex.org/W3004940340","https://openalex.org/W3012995967","https://openalex.org/W3015199127","https://openalex.org/W3027008958","https://openalex.org/W3095379519","https://openalex.org/W3095449605","https://openalex.org/W3096893582","https://openalex.org/W3099330747","https://openalex.org/W3099904761","https://openalex.org/W3120190303","https://openalex.org/W3124972797","https://openalex.org/W3130206595","https://openalex.org/W3162387328","https://openalex.org/W3162475350","https://openalex.org/W3163591408","https://openalex.org/W3206008172","https://openalex.org/W3206315738","https://openalex.org/W4200524548","https://openalex.org/W4214698081","https://openalex.org/W4226062543","https://openalex.org/W4226338831","https://openalex.org/W4295308317","https://openalex.org/W6726873649","https://openalex.org/W6749825310","https://openalex.org/W6769589523","https://openalex.org/W6777776875"],"related_works":["https://openalex.org/W2468279273","https://openalex.org/W2354198838","https://openalex.org/W1989130879","https://openalex.org/W2103419012","https://openalex.org/W2988126442","https://openalex.org/W2275988210","https://openalex.org/W2786094008","https://openalex.org/W3131501806","https://openalex.org/W2799683370","https://openalex.org/W2807745940"],"abstract_inverted_index":{"End-to-end":[0],"time-domain":[1,151],"speech":[2,21,48,84,147,152],"separation":[3,127],"with":[4,107],"masking":[5],"strategy":[6],"has":[7],"shown":[8],"its":[9],"performance":[10],"advantage,":[11],"where":[12],"a":[13,25,31,54,73,87,95,108],"1-D":[14],"convolutional":[15,110],"layer":[16],"is":[17],"used":[18],"as":[19],"the":[20,47,51,62,79,104,119,126,146],"encoder":[22],"to":[23,30,43,77],"encode":[24,103],"sliding":[26],"window":[27,41,56,88],"of":[28,64,83,89,130],"waveform":[29],"latent":[32,100,121],"feature":[33,116,122],"representation,":[34,101],"i.e.":[35],"an":[36],"embedding":[37],"vector.":[38],"A":[39],"large":[40],"leads":[42],"low":[44],"resolution":[45,59],"in":[46,86],"processing,":[49],"on":[50,133],"other":[52,150],"hand,":[53],"small":[55],"offers":[57],"high":[58,65],"but":[60],"at":[61],"expense":[63],"computational":[66],"cost.":[67],"In":[68],"this":[69],"work,":[70],"we":[71,93],"propose":[72],"graph":[74,96,109,115],"encoding":[75,142],"technique":[76,143],"model":[78],"fine":[80],"structural":[81,105],"knowledge":[82],"samples":[85],"reasonable":[90],"size.":[91],"Specifically,":[92],"build":[94],"representation":[97,117,123],"for":[98],"each":[99],"and":[102,124,128,136],"details":[106],"network":[111],"encoder.":[112],"The":[113],"encoded":[114],"complements":[118],"original":[120],"benefits":[125],"reconstruction":[129],"speech.":[131],"Experiments":[132],"various":[134],"models":[135],"datasets":[137],"show":[138],"that":[139],"our":[140],"proposed":[141],"significantly":[144],"improves":[145],"quality":[148],"over":[149],"encoders.":[153]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-27T14:29:43.386196","created_date":"2025-10-10T00:00:00"}
