{"id":"https://openalex.org/W4401416441","doi":"https://doi.org/10.1109/taslp.2024.3440638","title":"Coarse-to-Fine Target Speaker Extraction Based on Contextual Information Exploitation","display_name":"Coarse-to-Fine Target Speaker Extraction Based on Contextual Information Exploitation","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4401416441","doi":"https://doi.org/10.1109/taslp.2024.3440638"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2024.3440638","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2024.3440638","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100585683","display_name":"Xue Yang","orcid":"https://orcid.org/0000-0002-4146-9177"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xue Yang","raw_affiliation_strings":["Institute of Speech and Audio Information Processing, School of Information Science and Technology, Beijing University of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Speech and Audio Information Processing, School of Information Science and Technology, Beijing University of Technology, Beijing, China","institution_ids":["https://openalex.org/I37796252"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070475244","display_name":"Changchun Bao","orcid":"https://orcid.org/0000-0002-5606-5343"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changchun Bao","raw_affiliation_strings":["Institute of Speech and Audio Information Processing, School of Information Science and Technology, Beijing University of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Speech and Audio Information Processing, School of Information Science and Technology, Beijing University of Technology, Beijing, China","institution_ids":["https://openalex.org/I37796252"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059065171","display_name":"Xianhong Chen","orcid":"https://orcid.org/0000-0002-5001-0587"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xianhong Chen","raw_affiliation_strings":["Institute of Speech and Audio Information Processing, School of Information Science and Technology, Beijing University of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Speech and Audio Information Processing, School of Information Science and Technology, Beijing University of Technology, Beijing, China","institution_ids":["https://openalex.org/I37796252"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100585683"],"corresponding_institution_ids":["https://openalex.org/I37796252"],"apc_list":null,"apc_paid":null,"fwci":2.4187,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.89743997,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"32","issue":null,"first_page":"3795","last_page":"3810"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9678999781608582,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9678999781608582,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9595999717712402,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/extraction","display_name":"Extraction (chemistry)","score":0.6675602793693542},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5369840264320374},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3301636278629303},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.07729065418243408},{"id":"https://openalex.org/keywords/chromatography","display_name":"Chromatography","score":0.055841654539108276}],"concepts":[{"id":"https://openalex.org/C4725764","wikidata":"https://www.wikidata.org/wiki/Q844704","display_name":"Extraction (chemistry)","level":2,"score":0.6675602793693542},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5369840264320374},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3301636278629303},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.07729065418243408},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.055841654539108276}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2024.3440638","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2024.3440638","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3862795372","display_name":null,"funder_award_id":"62006010","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3909335432","display_name":null,"funder_award_id":"61831019","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":73,"referenced_works":["https://openalex.org/W1552314771","https://openalex.org/W2064675550","https://openalex.org/W2127851351","https://openalex.org/W2135158232","https://openalex.org/W2141998673","https://openalex.org/W2221409856","https://openalex.org/W2891833136","https://openalex.org/W2909607850","https://openalex.org/W2924115626","https://openalex.org/W2938646939","https://openalex.org/W2939771864","https://openalex.org/W2951130829","https://openalex.org/W2962866211","https://openalex.org/W2964058413","https://openalex.org/W2964171275","https://openalex.org/W2972541922","https://openalex.org/W2972802573","https://openalex.org/W2972922524","https://openalex.org/W2973062255","https://openalex.org/W3012065388","https://openalex.org/W3015191643","https://openalex.org/W3015199127","https://openalex.org/W3015623828","https://openalex.org/W3015636705","https://openalex.org/W3015915076","https://openalex.org/W3016361963","https://openalex.org/W3024147341","https://openalex.org/W3094806148","https://openalex.org/W3096090308","https://openalex.org/W3096214032","https://openalex.org/W3096730413","https://openalex.org/W3096893582","https://openalex.org/W3097353642","https://openalex.org/W3097653961","https://openalex.org/W3103434036","https://openalex.org/W3120336970","https://openalex.org/W3136499730","https://openalex.org/W3160464260","https://openalex.org/W3162534564","https://openalex.org/W3196570692","https://openalex.org/W3198234746","https://openalex.org/W3198575250","https://openalex.org/W3206706278","https://openalex.org/W4200634403","https://openalex.org/W4224919629","https://openalex.org/W4224936432","https://openalex.org/W4225302959","https://openalex.org/W4225592424","https://openalex.org/W4225905067","https://openalex.org/W4226021932","https://openalex.org/W4226185896","https://openalex.org/W4226338831","https://openalex.org/W4232747912","https://openalex.org/W4289665794","https://openalex.org/W4296068983","https://openalex.org/W4296070363","https://openalex.org/W4296070366","https://openalex.org/W4319862644","https://openalex.org/W4367597591","https://openalex.org/W4372260086","https://openalex.org/W4372271325","https://openalex.org/W4385756463","https://openalex.org/W4385807442","https://openalex.org/W4385822691","https://openalex.org/W4385822827","https://openalex.org/W4385823017","https://openalex.org/W4385823352","https://openalex.org/W4388342027","https://openalex.org/W4392902910","https://openalex.org/W4392903092","https://openalex.org/W4392908343","https://openalex.org/W4395471087","https://openalex.org/W6631190155"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"To":[0,102],"address":[1,103],"the":[2,6,17,32,38,42,57,66,79,85,96,100,112,116,135,148,152,162,166,173,177,181,189,197,201,213],"cocktail":[3],"party":[4],"problem,":[5],"target":[7,33,58,80],"speaker":[8,34,59],"extraction":[9,199,202],"(TSE)":[10],"has":[11],"received":[12,40,67,155],"increasing":[13],"attention":[14],"recently.":[15],"Typically,":[16],"TSE":[18,76],"is":[19,27,35,52,141,185,224,243],"explored":[20],"in":[21,115],"two":[22,47],"scenarios.":[23,248],"The":[24,49,192,236],"first":[25],"scenario":[26,51,211],"a":[28,53,106],"specific":[29,136],"one,":[30,55],"where":[31,56,212],"present":[36,62],"and":[37,65,154,215,242],"signal":[39,68,184],"by":[41,127],"microphone":[43],"contains":[44],"at":[45],"least":[46],"speakers.":[48,74],"second":[50],"universal":[54,210,234],"may":[60,69,92],"be":[61],"or":[63,72],"absent":[64],"contain":[70],"one":[71],"multiple":[73],"Numerous":[75],"studies":[77],"utilize":[78],"speaker's":[81],"embedding":[82,91],"to":[83,143,161,187,226],"guide":[84,188],"extraction.":[86,175,191],"However,":[87],"solely":[88],"utilizing":[89],"this":[90,104,125,205,232],"not":[93,218],"fully":[94],"leverage":[95],"contextual":[97,113],"information":[98,114],"within":[99],"enrollment.":[101],"limitation,":[105],"novel":[107],"approach":[108,126],"that":[109,168],"directly":[110],"exploits":[111],"time-frequency":[117],"(T-F)":[118],"domain":[119],"was":[120],"proposed.":[121],"This":[122,157],"paper":[123,206],"improves":[124],"integrating":[128],"our":[129,228],"previously":[130],"proposed":[131,229,237],"coarse-to-fine":[132],"framework.":[133],"For":[134],"scenario,":[137],"an":[138,208],"interaction":[139,146,159],"block":[140],"employed":[142],"facilitate":[144],"direct":[145,158],"between":[147],"T-F":[149,178],"representations":[150],"of":[151,165,180],"enrollment":[153,167],"signal.":[156],"leads":[160],"consistent":[163],"representation":[164,179,194],"serves":[169],"as":[170],"guidance":[171],"for":[172,231,246],"coarse":[174],"Afterwards,":[176],"coarsely":[182],"extracted":[183],"utilized":[186],"refining":[190,198],"residual":[193],"obtained":[195],"during":[196],"increases":[200],"precision.":[203],"Besides,":[204],"explores":[207],"undisturbed":[209,233],"noise":[214],"reverberation":[216],"are":[217],"considered.":[219],"A":[220],"two-level":[221],"decision-making":[222],"scheme":[223],"devised":[225],"generalize":[227],"method":[230,238],"scenario.":[235],"achieves":[239],"high":[240],"performance":[241],"proven":[244],"effective":[245],"both":[247]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":6}],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2025-10-10T00:00:00"}
