{"id":"https://openalex.org/W2139301611","doi":"https://doi.org/10.1109/icassp.2011.5947432","title":"Cross-Channel Spectral Subtraction for meeting speech recognition","display_name":"Cross-Channel Spectral Subtraction for meeting speech recognition","publication_year":2011,"publication_date":"2011-05-01","ids":{"openalex":"https://openalex.org/W2139301611","doi":"https://doi.org/10.1109/icassp.2011.5947432","mag":"2139301611"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2011.5947432","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2011.5947432","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://t2r2.star.titech.ac.jp/rrws/file/CTT100624006/ATD100000413/","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063793244","display_name":"Yu Nasu","orcid":null},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yu Nasu","raw_affiliation_strings":["Tokyo Institute of Technology, Meguro, Tokyo, Japan","Tokyo Institute of Technology, 2-12-1 Ookayama, Meguro-ku, 152-8552 Japan#TAB#"],"affiliations":[{"raw_affiliation_string":"Tokyo Institute of Technology, Meguro, Tokyo, Japan","institution_ids":["https://openalex.org/I114531698"]},{"raw_affiliation_string":"Tokyo Institute of Technology, 2-12-1 Ookayama, Meguro-ku, 152-8552 Japan#TAB#","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081629487","display_name":"Koichi Shinoda","orcid":"https://orcid.org/0000-0003-1095-3203"},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Koichi Shinoda","raw_affiliation_strings":["Tokyo Institute of Technology, Meguro, Tokyo, Japan","Tokyo Institute of Technology, 2-12-1 Ookayama, Meguro-ku, 152-8552 Japan#TAB#"],"affiliations":[{"raw_affiliation_string":"Tokyo Institute of Technology, Meguro, Tokyo, Japan","institution_ids":["https://openalex.org/I114531698"]},{"raw_affiliation_string":"Tokyo Institute of Technology, 2-12-1 Ookayama, Meguro-ku, 152-8552 Japan#TAB#","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009532108","display_name":"Sadaoki Furui","orcid":null},"institutions":[{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Sadaoki Furui","raw_affiliation_strings":["Tokyo Institute of Technology, Meguro, Tokyo, Japan","Tokyo Institute of Technology, 2-12-1 Ookayama, Meguro-ku, 152-8552 Japan#TAB#"],"affiliations":[{"raw_affiliation_string":"Tokyo Institute of Technology, Meguro, Tokyo, Japan","institution_ids":["https://openalex.org/I114531698"]},{"raw_affiliation_string":"Tokyo Institute of Technology, 2-12-1 Ookayama, Meguro-ku, 152-8552 Japan#TAB#","institution_ids":["https://openalex.org/I114531698"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5063793244"],"corresponding_institution_ids":["https://openalex.org/I114531698"],"apc_list":null,"apc_paid":null,"fwci":1.2478,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.80688399,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"2","issue":null,"first_page":"4812","last_page":"4815"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7527343034744263},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7497623562812805},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.6082693934440613},{"id":"https://openalex.org/keywords/microphone","display_name":"Microphone","score":0.5791738033294678},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.5545507669448853},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.5328583717346191},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.508759081363678},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.5076626539230347},{"id":"https://openalex.org/keywords/subtraction","display_name":"Subtraction","score":0.49603256583213806},{"id":"https://openalex.org/keywords/independent-component-analysis","display_name":"Independent component analysis","score":0.4705807566642761},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4475489556789398},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.44290825724601746},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.44119778275489807},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.4168117344379425},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.41436949372291565},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3940165042877197},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0886090099811554},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.08299487829208374},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08261221647262573},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.060781240463256836},{"id":"https://openalex.org/keywords/amplifier","display_name":"Amplifier","score":0.059928953647613525}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7527343034744263},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7497623562812805},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.6082693934440613},{"id":"https://openalex.org/C2778263558","wikidata":"https://www.wikidata.org/wiki/Q46384","display_name":"Microphone","level":3,"score":0.5791738033294678},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.5545507669448853},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.5328583717346191},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.508759081363678},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.5076626539230347},{"id":"https://openalex.org/C68060419","wikidata":"https://www.wikidata.org/wiki/Q40754","display_name":"Subtraction","level":2,"score":0.49603256583213806},{"id":"https://openalex.org/C51432778","wikidata":"https://www.wikidata.org/wiki/Q1259145","display_name":"Independent component analysis","level":2,"score":0.4705807566642761},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4475489556789398},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.44290825724601746},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.44119778275489807},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.4168117344379425},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.41436949372291565},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3940165042877197},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0886090099811554},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.08299487829208374},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08261221647262573},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.060781240463256836},{"id":"https://openalex.org/C194257627","wikidata":"https://www.wikidata.org/wiki/Q211554","display_name":"Amplifier","level":3,"score":0.059928953647613525},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.0},{"id":"https://openalex.org/C68115822","wikidata":"https://www.wikidata.org/wiki/Q1068172","display_name":"Sound pressure","level":2,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icassp.2011.5947432","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2011.5947432","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},{"id":"pmh:oai:t2r2.star.titech.ac.jp:50140974","is_oa":true,"landing_page_url":"http://t2r2.star.titech.ac.jp/cgi-bin/publicationinfo.cgi?q_publication_content_number=CTT100624006","pdf_url":"http://t2r2.star.titech.ac.jp/rrws/file/CTT100624006/ATD100000413/","source":{"id":"https://openalex.org/S4377196385","display_name":"Tokyo Tech Research Repository (Tokyo Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I114531698","host_organization_name":"Tokyo Institute of Technology","host_organization_lineage":["https://openalex.org/I114531698"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference Paper"}],"best_oa_location":{"id":"pmh:oai:t2r2.star.titech.ac.jp:50140974","is_oa":true,"landing_page_url":"http://t2r2.star.titech.ac.jp/cgi-bin/publicationinfo.cgi?q_publication_content_number=CTT100624006","pdf_url":"http://t2r2.star.titech.ac.jp/rrws/file/CTT100624006/ATD100000413/","source":{"id":"https://openalex.org/S4377196385","display_name":"Tokyo Tech Research Repository (Tokyo Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I114531698","host_organization_name":"Tokyo Institute of Technology","host_organization_lineage":["https://openalex.org/I114531698"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference Paper"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.46000000834465027,"id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G1158531229","display_name":"A study of multimodal recognition for human communication search","funder_award_id":"20300063","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G3236194794","display_name":null,"funder_award_id":"Grant-in-Aid","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G7167128334","display_name":null,"funder_award_id":"Grant-in-Aid for Scientific Researc","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G7337825077","display_name":null,"funder_award_id":"Grant-in-Aid for Sc","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G7531875455","display_name":"\u5927\u90fd\u5e02\u306a\u3089\u3073\u306b\u305d\u306e\u5468\u8fba\u5730\u57df\u306b\u304a\u3051\u308b\u5bb6\u5185\u52b4\u529b\u306e\u5b9f\u8a3c\u7684\u7814\u7a76\u2015\u3068\u304f\u306b\u5927\u962a\u3092\u4e2d\u5fc3\u3068\u3057\u3066\u2015","funder_award_id":"30006","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G8759943101","display_name":null,"funder_award_id":"rant-in-Aid for Scientific Research","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"}],"funders":[{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2139301611.pdf","grobid_xml":"https://content.openalex.org/works/W2139301611.grobid-xml"},"referenced_works_count":10,"referenced_works":["https://openalex.org/W16236365","https://openalex.org/W37526647","https://openalex.org/W1558276682","https://openalex.org/W2027884847","https://openalex.org/W2037592772","https://openalex.org/W2108384452","https://openalex.org/W2128653836","https://openalex.org/W2158336491","https://openalex.org/W4285719527","https://openalex.org/W6601563604"],"related_works":["https://openalex.org/W2118307209","https://openalex.org/W2107364365","https://openalex.org/W2046761971","https://openalex.org/W2553224454","https://openalex.org/W4281722104","https://openalex.org/W2803458999","https://openalex.org/W2765453402","https://openalex.org/W1497843931","https://openalex.org/W1503525627","https://openalex.org/W1785857632"],"abstract_inverted_index":{"We":[0],"propose":[1],"Cross-Channel":[2],"Spectral":[3],"Subtraction":[4],"(CCSS),":[5],"a":[6,73],"source":[7,45],"separation":[8,46],"method":[9,23],"for":[10,19],"recognizing":[11],"meeting":[12],"speech":[13,38,67,97],"where":[14],"one":[15],"microphone":[16],"is":[17],"prepared":[18],"each":[20],"speaker.":[21],"The":[22],"quickly":[24],"adapts":[25],"to":[26,35,87],"changes":[27],"in":[28,99],"transfer":[29],"functions":[30],"and":[31,64],"uses":[32],"spectral":[33],"subtraction":[34],"suppress":[36],"the":[37,65,82,93],"of":[39,76,96],"other":[40],"speakers.":[41],"Compared":[42],"with":[43],"conventional":[44],"methods":[47],"based":[48],"on":[49],"independent":[50],"component":[51],"analysis":[52],"(ICA)":[53],"or":[54],"that":[55],"use":[56],"binary":[57],"masks,":[58],"it":[59],"requires":[60],"less":[61,70],"computational":[62],"costs":[63],"resulting":[66],"signals":[68],"have":[69],"distortion.":[71],"In":[72],"recognition":[74,94],"task":[75],"computer-simulated,":[77],"partially-overlapped":[78],"speech,":[79],"CCSS":[80],"improved":[81,92],"word":[83],"accuracy":[84,95],"from":[85],"66.5%":[86],"77.7%.":[88],"It":[89],"also":[90],"significantly":[91],"data":[98],"actual":[100],"meetings.":[101]},"counts_by_year":[{"year":2021,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":2}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
