{"id":"https://openalex.org/W2165325039","doi":"https://doi.org/10.1109/asru.2007.4430086","title":"Minimum mutual information beamforming for simultaneous active speakers","display_name":"Minimum mutual information beamforming for simultaneous active speakers","publication_year":2007,"publication_date":"2007-01-01","ids":{"openalex":"https://openalex.org/W2165325039","doi":"https://doi.org/10.1109/asru.2007.4430086","mag":"2165325039"},"language":"en","primary_location":{"id":"doi:10.1109/asru.2007.4430086","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2007.4430086","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2007 IEEE Workshop on Automatic Speech Recognition &amp; Understanding (ASRU)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://infoscience.epfl.ch/record/146096","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053915317","display_name":"Kenichi Kumatani","orcid":null},"institutions":[{"id":"https://openalex.org/I7495430","display_name":"Idiap Research Institute","ror":"https://ror.org/05932h694","country_code":"CH","type":"facility","lineage":["https://openalex.org/I7495430"]},{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["CH","DE"],"is_corresponding":true,"raw_author_name":"Kenichi Kumatani","raw_affiliation_strings":["Idiap Research Institute, Switzerland","Intelligent Sensor-Actuator Systems (ISAS), University of Karlsruhe, Karlsruhe, Germany"],"affiliations":[{"raw_affiliation_string":"Idiap Research Institute, Switzerland","institution_ids":["https://openalex.org/I7495430"]},{"raw_affiliation_string":"Intelligent Sensor-Actuator Systems (ISAS), University of Karlsruhe, Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045638097","display_name":"Uwe Mayer","orcid":"https://orcid.org/0000-0001-6841-0282"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Uwe Mayer","raw_affiliation_strings":["Institute for Theoretical Computer Science, University of Karlsruhe, Karlsruhe, Germany"],"affiliations":[{"raw_affiliation_string":"Institute for Theoretical Computer Science, University of Karlsruhe, Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006308425","display_name":"Tobias Gehrig","orcid":null},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Tobias Gehrig","raw_affiliation_strings":["Institute for Theoretical Computer Science, University of Karlsruhe, Karlsruhe, Germany"],"affiliations":[{"raw_affiliation_string":"Institute for Theoretical Computer Science, University of Karlsruhe, Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064739113","display_name":"Emilian Stoimenov","orcid":null},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Emilian Stoimenov","raw_affiliation_strings":["Institute for Theoretical Computer Science, University of Karlsruhe, Karlsruhe, Germany"],"affiliations":[{"raw_affiliation_string":"Institute for Theoretical Computer Science, University of Karlsruhe, Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106034394","display_name":"John McDonough","orcid":null},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]},{"id":"https://openalex.org/I91712215","display_name":"Saarland University","ror":"https://ror.org/01jdpyv68","country_code":"DE","type":"education","lineage":["https://openalex.org/I91712215"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"John McDonough","raw_affiliation_strings":["Intelligent Sensor-Actuator Systems (ISAS), University of Karlsruhe, Karlsruhe, Germany","Spoken Language Systems, University of Saarland, Saarbruecken, Germany"],"affiliations":[{"raw_affiliation_string":"Intelligent Sensor-Actuator Systems (ISAS), University of Karlsruhe, Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]},{"raw_affiliation_string":"Spoken Language Systems, University of Saarland, Saarbruecken, Germany","institution_ids":["https://openalex.org/I91712215"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064051745","display_name":"Matthias W\u00f6lfel","orcid":"https://orcid.org/0000-0003-1601-5146"},"institutions":[{"id":"https://openalex.org/I102335020","display_name":"Karlsruhe Institute of Technology","ror":"https://ror.org/04t3en479","country_code":"DE","type":"education","lineage":["https://openalex.org/I102335020","https://openalex.org/I1305996414"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Matthias Wolfel","raw_affiliation_strings":["Institute for Theoretical Computer Science, University of Karlsruhe, Karlsruhe, Germany"],"affiliations":[{"raw_affiliation_string":"Institute for Theoretical Computer Science, University of Karlsruhe, Karlsruhe, Germany","institution_ids":["https://openalex.org/I102335020"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5053915317"],"corresponding_institution_ids":["https://openalex.org/I102335020","https://openalex.org/I7495430"],"apc_list":null,"apc_paid":null,"fwci":1.297,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.82121503,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"71","last_page":"76"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mutual-information","display_name":"Mutual information","score":0.6872652173042297},{"id":"https://openalex.org/keywords/beamforming","display_name":"Beamforming","score":0.591282844543457},{"id":"https://openalex.org/keywords/adaptive-beamformer","display_name":"Adaptive beamformer","score":0.5767685174942017},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5628610849380493},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.555996298789978},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.5558665990829468},{"id":"https://openalex.org/keywords/microphone","display_name":"Microphone","score":0.503490149974823},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.436161607503891},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.33897194266319275},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3195488452911377},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.12212666869163513},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.07647112011909485}],"concepts":[{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.6872652173042297},{"id":"https://openalex.org/C54197355","wikidata":"https://www.wikidata.org/wiki/Q5782992","display_name":"Beamforming","level":2,"score":0.591282844543457},{"id":"https://openalex.org/C33378366","wikidata":"https://www.wikidata.org/wiki/Q4680719","display_name":"Adaptive beamformer","level":3,"score":0.5767685174942017},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5628610849380493},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.555996298789978},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.5558665990829468},{"id":"https://openalex.org/C2778263558","wikidata":"https://www.wikidata.org/wiki/Q46384","display_name":"Microphone","level":3,"score":0.503490149974823},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.436161607503891},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.33897194266319275},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3195488452911377},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.12212666869163513},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.07647112011909485},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C68115822","wikidata":"https://www.wikidata.org/wiki/Q1068172","display_name":"Sound pressure","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/asru.2007.4430086","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2007.4430086","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2007 IEEE Workshop on Automatic Speech Recognition &amp; Understanding (ASRU)","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.142.8813","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.142.8813","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://isl.ira.uka.de/~wolfel/04430086.pdf","raw_type":"text"},{"id":"pmh:oai:infoscience.epfl.ch:146096","is_oa":true,"landing_page_url":"http://infoscience.epfl.ch/record/146096","pdf_url":null,"source":{"id":"https://openalex.org/S4306400487","display_name":"Infoscience (Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"}],"best_oa_location":{"id":"pmh:oai:infoscience.epfl.ch:146096","is_oa":true,"landing_page_url":"http://infoscience.epfl.ch/record/146096","pdf_url":null,"source":{"id":"https://openalex.org/S4306400487","display_name":"Infoscience (Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.44999998807907104}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W66216379","https://openalex.org/W181370797","https://openalex.org/W653761051","https://openalex.org/W1481646516","https://openalex.org/W1493163583","https://openalex.org/W1592671018","https://openalex.org/W1599512239","https://openalex.org/W1823291590","https://openalex.org/W2002342963","https://openalex.org/W2036494998","https://openalex.org/W2097003869","https://openalex.org/W2104160473","https://openalex.org/W2117678320","https://openalex.org/W2119243469","https://openalex.org/W2123649031","https://openalex.org/W2133270663","https://openalex.org/W2134910060","https://openalex.org/W2135346934","https://openalex.org/W2139737683","https://openalex.org/W2144523485","https://openalex.org/W2146871184","https://openalex.org/W2147166770","https://openalex.org/W2148457491","https://openalex.org/W2398121140","https://openalex.org/W2798766386","https://openalex.org/W3010782316","https://openalex.org/W4235358177","https://openalex.org/W4248145103","https://openalex.org/W6602649738","https://openalex.org/W6638410079"],"related_works":["https://openalex.org/W876328409","https://openalex.org/W818226659","https://openalex.org/W2996333928","https://openalex.org/W2009075871","https://openalex.org/W2132841313","https://openalex.org/W2518591292","https://openalex.org/W1976800395","https://openalex.org/W2105408150","https://openalex.org/W2606661315","https://openalex.org/W2548445082"],"abstract_inverted_index":{"In":[0,30,56,135],"this":[1],"work,":[2],"we":[3,35,68],"address":[4],"an":[5],"acoustic":[6],"beamforming":[7],"application":[8],"where":[9],"two":[10,48],"speakers":[11],"are":[12,98],"simultaneously":[13],"active.":[14],"We":[15,110],"construct":[16],"one":[17],"subband":[18,66],"domain":[19],"beamformer":[20,140,152],"in":[21,101],"generalized":[22],"sidelobe":[23],"canceller":[24],"(GSC)":[25],"configuration":[26],"for":[27,178],"each":[28],"source.":[29],"contrast":[31],"to":[32,46,58,90,107,165],"normal":[33],"practice,":[34],"then":[36],"jointly":[37],"adjust":[38],"the":[39,60,64,76,91,112,130,136,138,176],"active":[40],"weight":[41],"vectors":[42],"of":[43,63,93,114,121,147],"both":[44],"GSCs":[45],"obtain":[47],"output":[49],"signals":[50],"with":[51,168,181],"minimum":[52],"mutual":[53,61],"information":[54,62],"(MMI).":[55],"order":[57],"calculate":[59],"complex":[65],"snapshots,":[67],"consider":[69],"four":[70],"probability":[71],"density":[72,95],"functions":[73,96],"(pdfs),":[74],"namely":[75],"Gaussian,":[77],"Laplace,":[78],"K":[79,170],"<inf":[80,171],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[81,172],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">0</inf>":[82,173],"and":[83],"\u0413":[84],"pdfs.":[85],"The":[86,150],"latter":[87],"three":[88],"belong":[89],"class":[92],"super-Gaussian":[94],"that":[97],"typically":[99],"used":[100],"independent":[102],"component":[103],"analysis":[104],"as":[105],"opposed":[106],"conventional":[108],"beamforming.":[109],"demonstrate":[111],"effectiveness":[113],"our":[115],"proposed":[116],"technique":[117],"through":[118],"a":[119,142,154,169],"series":[120],"far-field":[122],"automatic":[123],"speech":[124],"recognition":[125],"experiments":[126],"on":[127],"data":[128,179],"from":[129],"PASCAL":[131],"Speech":[132],"Separation":[133],"Challenge.":[134],"experiments,":[137],"delay-and-sum":[139],"achieved":[141,157],"word":[143],"error":[144],"rate":[145],"(WER)":[146],"70.4":[148],"%.":[149,186],"MMI":[151],"under":[153],"Gaussian":[155],"assumption":[156],"55.2":[158],"%":[159,167],"WER":[160,177],"which":[161],"was":[162,184],"further":[163],"reduced":[164],"52.0":[166],"pdf,":[174],"whereas":[175],"recorded":[180],"close-talking":[182],"microphone":[183],"21.6":[185]},"counts_by_year":[{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
