{"id":"https://openalex.org/W2969987364","doi":"https://doi.org/10.1109/tmm.2019.2937185","title":"Audio\u2013Visual Particle Flow SMC-PHD Filtering for Multi-Speaker Tracking","display_name":"Audio\u2013Visual Particle Flow SMC-PHD Filtering for Multi-Speaker Tracking","publication_year":2019,"publication_date":"2019-08-23","ids":{"openalex":"https://openalex.org/W2969987364","doi":"https://doi.org/10.1109/tmm.2019.2937185","mag":"2969987364"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2019.2937185","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2019.2937185","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087484078","display_name":"Yang Liu","orcid":"https://orcid.org/0000-0001-7928-9473"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yang Liu","raw_affiliation_strings":["Centre for Vision, Speech and Signal Processing, University of Surrey, Guildford, U.K"],"raw_orcid":"https://orcid.org/0000-0001-7928-9473","affiliations":[{"raw_affiliation_string":"Centre for Vision, Speech and Signal Processing, University of Surrey, Guildford, U.K","institution_ids":["https://openalex.org/I28290843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063512115","display_name":"Volkan K\u0131l\u0131\u00e7","orcid":"https://orcid.org/0000-0002-3164-1981"},"institutions":[{"id":"https://openalex.org/I250383648","display_name":"Izmir K\u00e2tip \u00c7elebi University","ror":"https://ror.org/024nx4843","country_code":"TR","type":"education","lineage":["https://openalex.org/I250383648"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Volkan Kilic","raw_affiliation_strings":["Department of Electrical and Electronics Engineering, Izmir Katip Celebi University, Cigli-Izmir, Turkey"],"raw_orcid":"https://orcid.org/0000-0002-3164-1981","affiliations":[{"raw_affiliation_string":"Department of Electrical and Electronics Engineering, Izmir Katip Celebi University, Cigli-Izmir, Turkey","institution_ids":["https://openalex.org/I250383648"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059231561","display_name":"Jian Guan","orcid":"https://orcid.org/0000-0002-0945-1081"},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Guan","raw_affiliation_strings":["College of Computer Science and Technology, Harbin Engineering University, Harbin, China"],"raw_orcid":"https://orcid.org/0000-0002-0945-1081","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Harbin Engineering University, Harbin, China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100676721","display_name":"Wenwu Wang","orcid":"https://orcid.org/0000-0002-8393-5703"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Wenwu Wang","raw_affiliation_strings":["Centre for Vision, Speech and Signal Processing, University of Surrey, Guildford, U.K"],"raw_orcid":"https://orcid.org/0000-0002-8393-5703","affiliations":[{"raw_affiliation_string":"Centre for Vision, Speech and Signal Processing, University of Surrey, Guildford, U.K","institution_ids":["https://openalex.org/I28290843"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":8.6786,"has_fulltext":false,"cited_by_count":70,"citation_normalized_percentile":{"value":0.98393085,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"22","issue":"4","first_page":"934","last_page":"948"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/particle-filter","display_name":"Particle filter","score":0.7775648832321167},{"id":"https://openalex.org/keywords/probability-density-function","display_name":"Probability density function","score":0.692879855632782},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.6325951814651489},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5888655781745911},{"id":"https://openalex.org/keywords/posterior-probability","display_name":"Posterior probability","score":0.5444551110267639},{"id":"https://openalex.org/keywords/degeneracy","display_name":"Degeneracy (biology)","score":0.5215675234794617},{"id":"https://openalex.org/keywords/probability-distribution","display_name":"Probability distribution","score":0.4141785800457001},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4135086238384247},{"id":"https://openalex.org/keywords/kalman-filter","display_name":"Kalman filter","score":0.32647714018821716},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.31852346658706665},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2545035481452942},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.13966473937034607},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.0750981867313385}],"concepts":[{"id":"https://openalex.org/C52421305","wikidata":"https://www.wikidata.org/wiki/Q1151499","display_name":"Particle filter","level":3,"score":0.7775648832321167},{"id":"https://openalex.org/C197055811","wikidata":"https://www.wikidata.org/wiki/Q207522","display_name":"Probability density function","level":2,"score":0.692879855632782},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.6325951814651489},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5888655781745911},{"id":"https://openalex.org/C57830394","wikidata":"https://www.wikidata.org/wiki/Q278079","display_name":"Posterior probability","level":3,"score":0.5444551110267639},{"id":"https://openalex.org/C2777727622","wikidata":"https://www.wikidata.org/wiki/Q5251772","display_name":"Degeneracy (biology)","level":2,"score":0.5215675234794617},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.4141785800457001},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4135086238384247},{"id":"https://openalex.org/C157286648","wikidata":"https://www.wikidata.org/wiki/Q846780","display_name":"Kalman filter","level":2,"score":0.32647714018821716},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31852346658706665},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2545035481452942},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.13966473937034607},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.0750981867313385},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tmm.2019.2937185","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2019.2937185","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},{"id":"pmh:oai:epubs.surrey.ac.uk:852506","is_oa":false,"landing_page_url":"http://epubs.surrey.ac.uk/852506/1/LiuKGW_TMM_2019_postprint.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400680","display_name":"Surrey Research Insight Open Access (The University of Surrey)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I28290843","host_organization_name":"University of Surrey","host_organization_lineage":["https://openalex.org/I28290843"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.5099999904632568,"display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G3034362336","display_name":null,"funder_award_id":"EP/P022529/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G3186182679","display_name":null,"funder_award_id":"EP/L000539/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G6485023388","display_name":"Signal Processing Solutions for the Networked Battlespace","funder_award_id":"EP/K014307/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G7219166536","display_name":null,"funder_award_id":"EP/K014307/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G8995825145","display_name":null,"funder_award_id":"EP/N014111/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320322725","display_name":"China Scholarship Council","ror":"https://ror.org/04atp4p48"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":98,"referenced_works":["https://openalex.org/W126779258","https://openalex.org/W1511984033","https://openalex.org/W1574312318","https://openalex.org/W1583773829","https://openalex.org/W1704271451","https://openalex.org/W1869546201","https://openalex.org/W1974836130","https://openalex.org/W1990511877","https://openalex.org/W1993049922","https://openalex.org/W1999616028","https://openalex.org/W2002594585","https://openalex.org/W2014787937","https://openalex.org/W2016133308","https://openalex.org/W2022681226","https://openalex.org/W2024731832","https://openalex.org/W2037971948","https://openalex.org/W2042296034","https://openalex.org/W2053257056","https://openalex.org/W2055600978","https://openalex.org/W2059397726","https://openalex.org/W2064480843","https://openalex.org/W2069963355","https://openalex.org/W2073459066","https://openalex.org/W2075228798","https://openalex.org/W2076840531","https://openalex.org/W2077611006","https://openalex.org/W2080154195","https://openalex.org/W2084637638","https://openalex.org/W2088725063","https://openalex.org/W2101295974","https://openalex.org/W2104693680","https://openalex.org/W2105905583","https://openalex.org/W2121836097","https://openalex.org/W2124156864","https://openalex.org/W2125336414","https://openalex.org/W2126736494","https://openalex.org/W2129821199","https://openalex.org/W2129866629","https://openalex.org/W2131598171","https://openalex.org/W2134049031","https://openalex.org/W2136274821","https://openalex.org/W2137585588","https://openalex.org/W2142511364","https://openalex.org/W2144617132","https://openalex.org/W2145938889","https://openalex.org/W2147953023","https://openalex.org/W2148163382","https://openalex.org/W2149197198","https://openalex.org/W2150375101","https://openalex.org/W2160337655","https://openalex.org/W2161435744","https://openalex.org/W2168634963","https://openalex.org/W2183583556","https://openalex.org/W2230388028","https://openalex.org/W2250436945","https://openalex.org/W2256115477","https://openalex.org/W2277000961","https://openalex.org/W2316138215","https://openalex.org/W2396175075","https://openalex.org/W2398679842","https://openalex.org/W2405315082","https://openalex.org/W2419508326","https://openalex.org/W2503670596","https://openalex.org/W2508946312","https://openalex.org/W2515985766","https://openalex.org/W2517955251","https://openalex.org/W2579152745","https://openalex.org/W2588791810","https://openalex.org/W2591907837","https://openalex.org/W2611660948","https://openalex.org/W2611855292","https://openalex.org/W2771578571","https://openalex.org/W2792360069","https://openalex.org/W2884554680","https://openalex.org/W2997874413","https://openalex.org/W3210825051","https://openalex.org/W4240105987","https://openalex.org/W4244486013","https://openalex.org/W4255936169","https://openalex.org/W4285719527","https://openalex.org/W6605165268","https://openalex.org/W6630776994","https://openalex.org/W6634207956","https://openalex.org/W6637510947","https://openalex.org/W6656845118","https://openalex.org/W6668990524","https://openalex.org/W6679546383","https://openalex.org/W6681158678","https://openalex.org/W6682136349","https://openalex.org/W6689236602","https://openalex.org/W6692130329","https://openalex.org/W6713360056","https://openalex.org/W6725444226","https://openalex.org/W6726308168","https://openalex.org/W6737105044","https://openalex.org/W6737167180","https://openalex.org/W6767735135","https://openalex.org/W6803993044"],"related_works":["https://openalex.org/W2353687059","https://openalex.org/W2893341095","https://openalex.org/W4241043257","https://openalex.org/W1990418105","https://openalex.org/W1971430736","https://openalex.org/W2358572162","https://openalex.org/W4242391381","https://openalex.org/W1980528650","https://openalex.org/W3199393239","https://openalex.org/W4249885815"],"abstract_inverted_index":{"Sequential":[0],"Monte":[1],"Carlo":[2],"probability":[3,77],"hypothesis":[4],"density":[5,50],"(SMC-PHD)":[6],"filtering":[7],"is":[8,65],"a":[9,39,58],"popular":[10],"method":[11],"used":[12,66],"recently":[13],"for":[14,108],"audio-visual":[15],"(AV)":[16],"multi-speaker":[17],"tracking.":[18],"However,":[19],"due":[20],"to":[21,67,74,132],"the":[22,26,34,45,48,72,75,98,102,123],"weight":[23],"degeneracy":[24],"problem,":[25],"posterior":[27,76],"distribution":[28],"can":[29],"be":[30],"represented":[31],"poorly":[32],"by":[33],"estimated":[35],"probability,":[36],"when":[37],"only":[38],"few":[40],"particles":[41,69],"are":[42,105,114,130],"present":[43],"around":[44],"peak":[46],"of":[47],"likelihood":[49],"function.":[51],"To":[52],"address":[53],"this":[54],"issue,":[55],"we":[56],"propose":[57],"new":[59,92],"framework":[60],"where":[61,97],"particle":[62,86,109],"flow":[63],"(PF)":[64],"migrate":[68],"smoothly":[70],"from":[71,101],"prior":[73],"density.":[78],"We":[79],"consider":[80],"both":[81],"zero":[82],"and":[83,89,95,126,129,137],"non-zero":[84],"diffusion":[85],"flows":[87],"(ZPF/NPF),":[88],"developed":[90],"two":[91],"algorithms,":[93],"AV-ZPF-SMC-PHD":[94],"AV-NPF-SMC-PHD,":[96],"speaker":[99],"states":[100],"previous":[103],"frames":[104],"also":[106],"considered":[107],"relocation.":[110],"The":[111],"proposed":[112],"algorithms":[113],"compared":[115],"systematically":[116],"with":[117],"several":[118],"baseline":[119],"tracking":[120,135],"methods":[121],"using":[122],"AV16.3,":[124],"AVDIAR":[125],"CLEAR":[127],"datasets,":[128],"shown":[131],"offer":[133],"improved":[134],"accuracy":[136],"average":[138],"effective":[139],"sample":[140],"size":[141],"(ESS).":[142]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":29},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":21}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
