{"id":"https://openalex.org/W4408352715","doi":"https://doi.org/10.1109/icassp49660.2025.10890556","title":"Cross-Talk Detection in the IVAS Stereo Codec Based on GCC-PHAT","display_name":"Cross-Talk Detection in the IVAS Stereo Codec Based on GCC-PHAT","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408352715","doi":"https://doi.org/10.1109/icassp49660.2025.10890556"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10890556","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890556","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035421144","display_name":"Vladim\u00edr Malenovsk\u00fd","orcid":null},"institutions":[{"id":"https://openalex.org/I135117807","display_name":"Universit\u00e9 de Sherbrooke","ror":"https://ror.org/00kybxq39","country_code":"CA","type":"education","lineage":["https://openalex.org/I135117807"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Vladimir Malenovsky","raw_affiliation_strings":["Universit&#x00E9; de Sherbrooke,Sherbrooke,Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; de Sherbrooke,Sherbrooke,Canada","institution_ids":["https://openalex.org/I135117807"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064493222","display_name":"Tommy Vaillancourt","orcid":null},"institutions":[{"id":"https://openalex.org/I135117807","display_name":"Universit\u00e9 de Sherbrooke","ror":"https://ror.org/00kybxq39","country_code":"CA","type":"education","lineage":["https://openalex.org/I135117807"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Tommy Vaillancourt","raw_affiliation_strings":["Universit&#x00E9; de Sherbrooke,Sherbrooke,Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; de Sherbrooke,Sherbrooke,Canada","institution_ids":["https://openalex.org/I135117807"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062644401","display_name":"Milan Jelinek","orcid":null},"institutions":[{"id":"https://openalex.org/I135117807","display_name":"Universit\u00e9 de Sherbrooke","ror":"https://ror.org/00kybxq39","country_code":"CA","type":"education","lineage":["https://openalex.org/I135117807"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Milan Jelinek","raw_affiliation_strings":["Universit&#x00E9; de Sherbrooke,Sherbrooke,Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; de Sherbrooke,Sherbrooke,Canada","institution_ids":["https://openalex.org/I135117807"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008807732","display_name":"Eleni Fotopoulou","orcid":"https://orcid.org/0000-0001-7683-4616"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Eleni Fotopoulou","raw_affiliation_strings":["DSP Solutions GmbH &amp; Co. KG,Regensburg,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DSP Solutions GmbH &amp; Co. KG,Regensburg,Germany","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036973211","display_name":"Emmanuel Ravelli","orcid":null},"institutions":[{"id":"https://openalex.org/I4210124274","display_name":"Fraunhofer Institute for Integrated Circuits","ror":"https://ror.org/024ape423","country_code":"DE","type":"facility","lineage":["https://openalex.org/I4210124274","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Emmanuel Ravelli","raw_affiliation_strings":["Fraunhofer IIS,Erlangen,Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Fraunhofer IIS,Erlangen,Germany","institution_ids":["https://openalex.org/I4210124274"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.02925293,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12720","display_name":"Multimedia Communication and Technology","score":0.9341999888420105,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.925599992275238,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/codec","display_name":"Codec","score":0.8257408142089844},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6413730382919312},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.257003515958786}],"concepts":[{"id":"https://openalex.org/C161765866","wikidata":"https://www.wikidata.org/wiki/Q184748","display_name":"Codec","level":2,"score":0.8257408142089844},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6413730382919312},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.257003515958786}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icassp49660.2025.10890556","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890556","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},{"id":"pmh:oai:publica.fraunhofer.de:publica/490262","is_oa":false,"landing_page_url":"https://publica.fraunhofer.de/handle/publica/490262","pdf_url":null,"source":{"id":"https://openalex.org/S4306400318","display_name":"Fraunhofer-Publica (Fraunhofer-Gesellschaft)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4923324","host_organization_name":"Fraunhofer-Gesellschaft","host_organization_lineage":["https://openalex.org/I4923324"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"conference paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W1481955708","https://openalex.org/W1558276682","https://openalex.org/W2046317813","https://openalex.org/W2087295741","https://openalex.org/W2109689012","https://openalex.org/W2141532435","https://openalex.org/W2157850507","https://openalex.org/W2968071640","https://openalex.org/W3015780472","https://openalex.org/W6630442970","https://openalex.org/W6634347048","https://openalex.org/W6772349387"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2964213236","https://openalex.org/W2163719598","https://openalex.org/W3161919736","https://openalex.org/W2387018512","https://openalex.org/W2107680156","https://openalex.org/W4301184752","https://openalex.org/W2288771647"],"abstract_inverted_index":{"In":[0],"real-time":[1],"teleconferences":[2],"over":[3],"mobile":[4],"networks,":[5],"cross-talk":[6,88,129],"can":[7,26,45],"significantly":[8],"impact":[9],"the":[10,32,49,75,82,108,116],"performance":[11,121],"of":[12],"parametric":[13,64],"stereo":[14,24,65,71,110,118],"codecs,":[15],"particularly":[16],"at":[17],"low":[18],"bitrates.":[19],"When":[20],"multiple":[21],"speakers":[22],"overlap,":[23],"quality":[25,127],"be":[27,46],"improved":[28],"by":[29],"independently":[30],"encoding":[31],"left":[33],"and":[34,67,99],"right":[35],"channels,":[36],"especially":[37],"when":[38],"inter-channel":[39],"correlation":[40],"is":[41],"low.":[42],"This":[43],"approach":[44],"implemented":[47],"using":[48],"dual-mono":[50,76],"EVS":[51,77],"coder,":[52],"for":[53,104],"example.":[54],"The":[55],"recently":[56],"standardized":[57],"3GPP":[58,83],"IVAS":[59,84,117],"codec":[60,85,119],"incorporates":[61],"both":[62],"a":[63,87,92],"model":[66,72,95],"an":[68],"independent":[69],"left/right":[70],"based":[73,96],"on":[74,97],"codec.":[78],"To":[79],"address":[80],"cross-talk,":[81],"features":[86],"classifier":[89],"that":[90,115],"uses":[91],"multivariate":[93],"statistical":[94],"GCC-PHAT":[98],"other":[100],"spatial":[101],"cues,":[102],"allowing":[103],"seamless":[105],"switching":[106],"between":[107],"two":[109],"models.":[111],"Listening":[112],"tests":[113],"show":[114],"enhances":[120],"in":[122,128],"single-talker":[123],"scenarios":[124],"while":[125],"maintaining":[126],"segments.":[130]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
