{"id":"https://openalex.org/W2135081730","doi":"https://doi.org/10.1155/s1110865702207015","title":"Separation of Audio-Visual Speech Sources: A New Approach Exploiting the Audio-Visual Coherence of Speech Stimuli","display_name":"Separation of Audio-Visual Speech Sources: A New Approach Exploiting the Audio-Visual Coherence of Speech Stimuli","publication_year":2002,"publication_date":"2002-11-28","ids":{"openalex":"https://openalex.org/W2135081730","doi":"https://doi.org/10.1155/s1110865702207015","mag":"2135081730"},"language":"en","primary_location":{"id":"doi:10.1155/s1110865702207015","is_oa":true,"landing_page_url":"https://doi.org/10.1155/s1110865702207015","pdf_url":null,"source":{"id":"https://openalex.org/S35920007","display_name":"EURASIP Journal on Advances in Signal Processing","issn_l":"1687-6172","issn":["1687-6172","1687-6180"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Advances in Signal Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1155/s1110865702207015","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087166091","display_name":"David Sodoyer","orcid":"https://orcid.org/0000-0001-9081-3950"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I899635006","display_name":"Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/02rx3b187","country_code":"FR","type":"education","lineage":["https://openalex.org/I899635006"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"David Sodoyer","raw_affiliation_strings":["Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, CNRS UMR 5009, ICP, INPG, 46 avenue F\u00e9lix Viallet, Grenoble Cedex 1, 38031, France","Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, ICP, INPG, Grenoble Cedex, France#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, CNRS UMR 5009, ICP, INPG, 46 avenue F\u00e9lix Viallet, Grenoble Cedex 1, 38031, France","institution_ids":["https://openalex.org/I1294671590"]},{"raw_affiliation_string":"Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, ICP, INPG, Grenoble Cedex, France#TAB#","institution_ids":["https://openalex.org/I899635006"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001142101","display_name":"Jean\u2010Luc Schwartz","orcid":"https://orcid.org/0000-0001-8969-9185"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I899635006","display_name":"Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/02rx3b187","country_code":"FR","type":"education","lineage":["https://openalex.org/I899635006"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Jean-Luc Schwartz","raw_affiliation_strings":["Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, CNRS UMR 5009, ICP, INPG, 46 avenue F\u00e9lix Viallet, Grenoble Cedex 1, 38031, France","Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, ICP, INPG, Grenoble Cedex, France#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, CNRS UMR 5009, ICP, INPG, 46 avenue F\u00e9lix Viallet, Grenoble Cedex 1, 38031, France","institution_ids":["https://openalex.org/I1294671590"]},{"raw_affiliation_string":"Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, ICP, INPG, Grenoble Cedex, France#TAB#","institution_ids":["https://openalex.org/I899635006"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020392160","display_name":"Laurent Girin","orcid":"https://orcid.org/0000-0002-9214-8760"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I899635006","display_name":"Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/02rx3b187","country_code":"FR","type":"education","lineage":["https://openalex.org/I899635006"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Laurent Girin","raw_affiliation_strings":["Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, CNRS UMR 5009, ICP, INPG, 46 avenue F\u00e9lix Viallet, Grenoble Cedex 1, 38031, France","Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, ICP, INPG, Grenoble Cedex, France#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, CNRS UMR 5009, ICP, INPG, 46 avenue F\u00e9lix Viallet, Grenoble Cedex 1, 38031, France","institution_ids":["https://openalex.org/I1294671590"]},{"raw_affiliation_string":"Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, ICP, INPG, Grenoble Cedex, France#TAB#","institution_ids":["https://openalex.org/I899635006"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046685023","display_name":"Jacob Klinkisch","orcid":null},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I899635006","display_name":"Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/02rx3b187","country_code":"FR","type":"education","lineage":["https://openalex.org/I899635006"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Jacob Klinkisch","raw_affiliation_strings":["Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, CNRS UMR 5009, ICP, INPG, 46 avenue F\u00e9lix Viallet, Grenoble Cedex 1, 38031, France","Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, ICP, INPG, Grenoble Cedex, France#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, CNRS UMR 5009, ICP, INPG, 46 avenue F\u00e9lix Viallet, Grenoble Cedex 1, 38031, France","institution_ids":["https://openalex.org/I1294671590"]},{"raw_affiliation_string":"Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, ICP, INPG, Grenoble Cedex, France#TAB#","institution_ids":["https://openalex.org/I899635006"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055562421","display_name":"Christian Jutten","orcid":"https://orcid.org/0000-0002-4477-4847"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I177483745","display_name":"Universit\u00e9 Joseph Fourier","ror":"https://ror.org/02aj0kh94","country_code":"FR","type":"education","lineage":["https://openalex.org/I177483745"]},{"id":"https://openalex.org/I4210114274","display_name":"Laboratoire d\u2019Informatique et Syst\u00e8mes","ror":"https://ror.org/0257sgk90","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I143002897","https://openalex.org/I21491767","https://openalex.org/I4210114274"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Christian Jutten","raw_affiliation_strings":["Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, CNRS UMR 5009, ICP, INPG, 46 avenue F\u00e9lix Viallet, Grenoble Cedex 1, 38031, France","Laboratoire des Images et des Signaux, Institut National Polytechnique de Grenoble, Universit\u00e9 Joseph Fourier, LIS, INPG, Grenoble Cedex, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institut de la Communication Parl\u00e9e, Institut National Polytechnique de Grenoble, Universit\u00e9 Stendhal, CNRS UMR 5009, ICP, INPG, 46 avenue F\u00e9lix Viallet, Grenoble Cedex 1, 38031, France","institution_ids":["https://openalex.org/I1294671590"]},{"raw_affiliation_string":"Laboratoire des Images et des Signaux, Institut National Polytechnique de Grenoble, Universit\u00e9 Joseph Fourier, LIS, INPG, Grenoble Cedex, France","institution_ids":["https://openalex.org/I177483745","https://openalex.org/I4210114274"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5087166091"],"corresponding_institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I899635006"],"apc_list":{"value":1140,"currency":"GBP","value_usd":1398},"apc_paid":{"value":1140,"currency":"GBP","value_usd":1398},"fwci":2.3143,"has_fulltext":true,"cited_by_count":46,"citation_normalized_percentile":{"value":0.89457639,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"2002","issue":"11","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7710028886795044},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.701183021068573},{"id":"https://openalex.org/keywords/coherence","display_name":"Coherence (philosophical gambling strategy)","score":0.6013089418411255},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.5604516267776489},{"id":"https://openalex.org/keywords/vowel","display_name":"Vowel","score":0.45138412714004517},{"id":"https://openalex.org/keywords/audio-visual","display_name":"Audio visual","score":0.4485093057155609},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.439119428396225},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36553698778152466},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15919968485832214}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7710028886795044},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.701183021068573},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.6013089418411255},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.5604516267776489},{"id":"https://openalex.org/C2779581591","wikidata":"https://www.wikidata.org/wiki/Q36244","display_name":"Vowel","level":2,"score":0.45138412714004517},{"id":"https://openalex.org/C3017588708","wikidata":"https://www.wikidata.org/wiki/Q758901","display_name":"Audio visual","level":2,"score":0.4485093057155609},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.439119428396225},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36553698778152466},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15919968485832214},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1155/s1110865702207015","is_oa":true,"landing_page_url":"https://doi.org/10.1155/s1110865702207015","pdf_url":null,"source":{"id":"https://openalex.org/S35920007","display_name":"EURASIP Journal on Advances in Signal Processing","issn_l":"1687-6172","issn":["1687-6172","1687-6180"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Advances in Signal Processing","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:fe7866ac46bc45c3bcb1057210cc962a","is_oa":true,"landing_page_url":"https://doaj.org/article/fe7866ac46bc45c3bcb1057210cc962a","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"EURASIP Journal on Advances in Signal Processing, Vol 2002, Iss 11, p 382823 (2002)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1155/s1110865702207015","is_oa":true,"landing_page_url":"https://doi.org/10.1155/s1110865702207015","pdf_url":null,"source":{"id":"https://openalex.org/S35920007","display_name":"EURASIP Journal on Advances in Signal Processing","issn_l":"1687-6172","issn":["1687-6172","1687-6180"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Advances in Signal Processing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W177229737","https://openalex.org/W586860715","https://openalex.org/W1488183088","https://openalex.org/W1977067929","https://openalex.org/W2024991751","https://openalex.org/W2038010270","https://openalex.org/W2056211671","https://openalex.org/W2091349387","https://openalex.org/W2099741732","https://openalex.org/W2122393449","https://openalex.org/W2127211243","https://openalex.org/W2128967371","https://openalex.org/W2167217202","https://openalex.org/W6659817735","https://openalex.org/W6674802330"],"related_works":["https://openalex.org/W2121231314","https://openalex.org/W2300973977","https://openalex.org/W2271369634","https://openalex.org/W2350550760","https://openalex.org/W578794879","https://openalex.org/W2025869674","https://openalex.org/W2625296515","https://openalex.org/W2052948815","https://openalex.org/W2091238608","https://openalex.org/W4386936765"],"abstract_inverted_index":{"We":[0,49,105,163],"present":[1,72,139],"a":[2,73,84,109,140,146,153,158],"new":[3],"approach":[4],"to":[5,30,82,94,124,191],"the":[6,11,22,27,45,51,95,100,113,126],"source":[7,85],"separation":[8,129,143,166,199],"problem":[9],"in":[10,157,189],"case":[12,52,101],"of":[13,24,53,58,88,102,112,116,142,148,160,173],"multiple":[14],"speech":[15,34],"signals.":[16],"The":[17],"method":[18],"is":[19,29,79,122],"based":[20],"on":[21,65,145],"use":[23],"automatic":[25],"lipreading,":[26],"objective":[28],"extract":[31],"an":[32,54],"acoustic":[33,38],"signal":[35],"from":[36],"other":[37,161],"signals":[39],"by":[40,133,152],"exploiting":[41],"its":[42,89],"coherence":[43],"with":[44,61,195],"speaker\u2032s":[46],"lip":[47],"movements.":[48],"consider":[50],"additive":[55],"stationary":[56],"mixture":[57,159],"decorrelated":[59],"sources,":[60],"no":[62],"further":[63],"assumptions":[64],"independence":[66],"or":[67,200],"non-Gaussian":[68],"character.":[69],"Firstly,":[70],"we":[71,98,138],"theoretical":[74],"framework":[75],"showing":[76],"that":[77,165],"it":[78],"indeed":[80],"possible":[81],"separate":[83],"when":[86],"some":[87],"spectral":[90,119],"characteristics":[91],"are":[92,184,187],"provided":[93],"system.":[96],"Then":[97],"address":[99],"audio-visual":[103,127],"sources.":[104,178],"show":[106,164],"how,":[107],"if":[108],"statistical":[110],"model":[111],"joint":[114],"probability":[115],"visual":[117],"and":[118,176,186],"audio":[120,198],"input":[121],"learnt":[123],"quantify":[125],"coherence,":[128],"can":[130,167],"be":[131,168],"achieved":[132],"maximizing":[134],"this":[135],"probability.":[136],"Finally,":[137],"number":[141],"results":[144],"corpus":[147],"vowel-plosive-vowel":[149],"sequences":[150],"uttered":[151],"single":[154],"speaker,":[155],"embedded":[156],"voices.":[162],"quite":[169],"good":[170],"for":[171],"mixtures":[172],"2,":[174],"3,":[175],"5":[177],"These":[179],"results,":[180],"while":[181],"very":[182],"preliminary,":[183],"encouraging,":[185],"discussed":[188],"respect":[190],"their":[192],"potential":[193],"complementarity":[194],"traditional":[196],"pure":[197],"enhancement":[201],"techniques.":[202]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":5},{"year":2012,"cited_by_count":2}],"updated_date":"2026-06-19T15:47:20.252518","created_date":"2025-10-10T00:00:00"}
