{"id":"https://openalex.org/W2771578571","doi":"https://doi.org/10.1109/iccais.2017.8217590","title":"Multiple speaker tracking with the GLMB filter","display_name":"Multiple speaker tracking with the GLMB filter","publication_year":2017,"publication_date":"2017-10-01","ids":{"openalex":"https://openalex.org/W2771578571","doi":"https://doi.org/10.1109/iccais.2017.8217590","mag":"2771578571"},"language":"en","primary_location":{"id":"doi:10.1109/iccais.2017.8217590","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccais.2017.8217590","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 International Conference on Control, Automation and Information Sciences (ICCAIS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://figshare.com/articles/conference_contribution/Multiple_Speaker_Tracking_with_the_GLMB_Filter/27404376","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020848196","display_name":"Du Yong Kim","orcid":"https://orcid.org/0000-0001-6882-2324"},"institutions":[{"id":"https://openalex.org/I205640436","display_name":"Curtin University","ror":"https://ror.org/02n415q13","country_code":"AU","type":"education","lineage":["https://openalex.org/I205640436"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Du Yong Kim","raw_affiliation_strings":["Dept. of Electrical and Computer Engineering, Curtin University, Bentley, Australia"],"affiliations":[{"raw_affiliation_string":"Dept. of Electrical and Computer Engineering, Curtin University, Bentley, Australia","institution_ids":["https://openalex.org/I205640436"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070960013","display_name":"Ba-Tuong Vo","orcid":"https://orcid.org/0000-0002-3954-238X"},"institutions":[{"id":"https://openalex.org/I205640436","display_name":"Curtin University","ror":"https://ror.org/02n415q13","country_code":"AU","type":"education","lineage":["https://openalex.org/I205640436"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Ba-Tuong Vo","raw_affiliation_strings":["Dept. of Electrical and Computer Engineering, Curtin University, Bentley, Australia"],"affiliations":[{"raw_affiliation_string":"Dept. of Electrical and Computer Engineering, Curtin University, Bentley, Australia","institution_ids":["https://openalex.org/I205640436"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023874572","display_name":"Sven Nordholm","orcid":"https://orcid.org/0000-0001-8942-5328"},"institutions":[{"id":"https://openalex.org/I205640436","display_name":"Curtin University","ror":"https://ror.org/02n415q13","country_code":"AU","type":"education","lineage":["https://openalex.org/I205640436"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Sven Nordholm","raw_affiliation_strings":["Dept. of Electrical and Computer Engineering, Curtin University, Bentley, Australia"],"affiliations":[{"raw_affiliation_string":"Dept. of Electrical and Computer Engineering, Curtin University, Bentley, Australia","institution_ids":["https://openalex.org/I205640436"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5020848196"],"corresponding_institution_ids":["https://openalex.org/I205640436"],"apc_list":null,"apc_paid":null,"fwci":0.1864,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.48723187,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"5","issue":null,"first_page":"38","last_page":"43"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10326","display_name":"Indoor and Outdoor Localization Technologies","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10711","display_name":"Target Tracking and Data Fusion in Sensor Networks","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/microphone","display_name":"Microphone","score":0.7168659567832947},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6832917332649231},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.6364055871963501},{"id":"https://openalex.org/keywords/spurious-relationship","display_name":"Spurious relationship","score":0.6355217695236206},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.5944528579711914},{"id":"https://openalex.org/keywords/multilateration","display_name":"Multilateration","score":0.5452651381492615},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.528606116771698},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4979431629180908},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.4757813513278961},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.4174567759037018},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37180328369140625},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.30430448055267334},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.25730007886886597},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.09799814224243164},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.0777716338634491},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.07558780908584595}],"concepts":[{"id":"https://openalex.org/C2778263558","wikidata":"https://www.wikidata.org/wiki/Q46384","display_name":"Microphone","level":3,"score":0.7168659567832947},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6832917332649231},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.6364055871963501},{"id":"https://openalex.org/C97256817","wikidata":"https://www.wikidata.org/wiki/Q1462316","display_name":"Spurious relationship","level":2,"score":0.6355217695236206},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5944528579711914},{"id":"https://openalex.org/C104037064","wikidata":"https://www.wikidata.org/wiki/Q1640884","display_name":"Multilateration","level":3,"score":0.5452651381492615},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.528606116771698},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4979431629180908},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.4757813513278961},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.4174567759037018},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37180328369140625},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.30430448055267334},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.25730007886886597},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.09799814224243164},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.0777716338634491},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.07558780908584595},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C68115822","wikidata":"https://www.wikidata.org/wiki/Q1068172","display_name":"Sound pressure","level":2,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/iccais.2017.8217590","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccais.2017.8217590","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 International Conference on Control, Automation and Information Sciences (ICCAIS)","raw_type":"proceedings-article"},{"id":"pmh:oai:alma.61RMIT_INST:11248142800001341","is_oa":false,"landing_page_url":"http://doi.org/10.1109/ICCAIS.2017.8217590","pdf_url":null,"source":{"id":"https://openalex.org/S4306402074","display_name":"RMIT Research Repository (RMIT University Library)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I82951845","host_organization_name":"RMIT University","host_organization_lineage":["https://openalex.org/I82951845"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:espace.curtin.edu.au:20.500.11937/67212","is_oa":false,"landing_page_url":"http://hdl.handle.net/20.500.11937/67212","pdf_url":null,"source":{"id":"https://openalex.org/S4306401790","display_name":"eSpace (Curtin University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205640436","host_organization_name":"Curtin University","host_organization_lineage":["https://openalex.org/I205640436"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference Paper"},{"id":"pmh:oai:figshare.com:article/27404376","is_oa":true,"landing_page_url":"https://figshare.com/articles/conference_contribution/Multiple_Speaker_Tracking_with_the_GLMB_Filter/27404376","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"}],"best_oa_location":{"id":"pmh:oai:figshare.com:article/27404376","is_oa":true,"landing_page_url":"https://figshare.com/articles/conference_contribution/Multiple_Speaker_Tracking_with_the_GLMB_Filter/27404376","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W34992941","https://openalex.org/W652333456","https://openalex.org/W1557595030","https://openalex.org/W1648602279","https://openalex.org/W1745301770","https://openalex.org/W1965417653","https://openalex.org/W2014787937","https://openalex.org/W2041184946","https://openalex.org/W2046317813","https://openalex.org/W2049244691","https://openalex.org/W2098957643","https://openalex.org/W2101414012","https://openalex.org/W2105905583","https://openalex.org/W2106873007","https://openalex.org/W2107493093","https://openalex.org/W2110097273","https://openalex.org/W2110354007","https://openalex.org/W2113744809","https://openalex.org/W2117678320","https://openalex.org/W2120350100","https://openalex.org/W2128970593","https://openalex.org/W2146053319","https://openalex.org/W2148613904","https://openalex.org/W2149900846","https://openalex.org/W2150704472","https://openalex.org/W2154353836","https://openalex.org/W2155167894","https://openalex.org/W2156954690","https://openalex.org/W2161435744","https://openalex.org/W2162654459","https://openalex.org/W2163994287","https://openalex.org/W2164427415","https://openalex.org/W2571592432","https://openalex.org/W2744999242","https://openalex.org/W2963272312","https://openalex.org/W4249052411","https://openalex.org/W4254263845","https://openalex.org/W6633511732","https://openalex.org/W6674665634","https://openalex.org/W6682279650","https://openalex.org/W6742696630"],"related_works":["https://openalex.org/W2380293945","https://openalex.org/W3113091479","https://openalex.org/W1500522817","https://openalex.org/W2162899405","https://openalex.org/W1974812937","https://openalex.org/W3095239554","https://openalex.org/W941090075","https://openalex.org/W3212409750","https://openalex.org/W4387088887","https://openalex.org/W17155033"],"abstract_inverted_index":{"In":[0],"this":[1],"paper":[2],"we":[3],"propose":[4],"a":[5,20],"new":[6],"solution":[7],"to":[8,100],"the":[9,39,45,74,85,90,94,104,115,119],"problem":[10],"of":[11,58,64,93],"tracking":[12,47,87],"multiple":[13,16,68],"speakers":[14,116],"from":[15,97,108],"microphone":[17],"arrays":[18],"in":[19,44,66,71,118],"reverberant":[21],"acoustic":[22,25],"environment.":[23],"The":[24,80],"environment":[26],"with":[27,32,73,84],"its":[28,33],"complex":[29],"reflection":[30],"patterns":[31],"underlying":[34],"data":[35,98,101],"association":[36],"uncertainty":[37],"pose":[38],"two":[40],"most":[41],"significant":[42],"challenges":[43],"multi-speaker":[46],"problem.":[48],"We":[49],"provide":[50],"an":[51],"approach":[52],"that":[53],"employs":[54],"individual":[55],"Time":[56],"Difference":[57],"Arrival":[59],"measurements":[60,82,106],"collected":[61],"by":[62],"pairs":[63,70],"microphones":[65],"using":[67],"distributed":[69,81],"conjunction":[72],"Generalized":[75],"Labeled":[76],"Multi-Bernoulli":[77],"(GLMB)":[78],"tracker.":[79],"together":[83],"GLMB":[86],"filter":[88],"exploits":[89],"spatiotemporal":[91],"correlation":[92],"true":[95],"sources":[96],"frame":[99],"frame,":[102],"whereas":[103],"spurious":[105],"arising":[107],"reverberations":[109],"exhibit":[110],"no":[111],"temporal":[112],"consistency":[113],"as":[114],"move":[117],"room.":[120]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
