{"id":"https://openalex.org/W2075360134","doi":"https://doi.org/10.1163/156855309x431659","title":"Human Tracking System Integrating Sound and Face Localization Using an Expectation-Maximization Algorithm in Real Environments","display_name":"Human Tracking System Integrating Sound and Face Localization Using an Expectation-Maximization Algorithm in Real Environments","publication_year":2009,"publication_date":"2009-01-01","ids":{"openalex":"https://openalex.org/W2075360134","doi":"https://doi.org/10.1163/156855309x431659","mag":"2075360134"},"language":"en","primary_location":{"id":"doi:10.1163/156855309x431659","is_oa":false,"landing_page_url":"https://doi.org/10.1163/156855309x431659","pdf_url":null,"source":{"id":"https://openalex.org/S192584203","display_name":"Advanced Robotics","issn_l":"0169-1864","issn":["0169-1864","1568-5535"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advanced Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111821094","display_name":"Hyun-Don Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Hyun-Don Kim","raw_affiliation_strings":["a Department of Intelligence Science and Technology, Graduate School of Informatics, Kyoto University, Yoshida-honmachi, Sakyo-ku, Kyoto 606-8501, Japan"],"affiliations":[{"raw_affiliation_string":"a Department of Intelligence Science and Technology, Graduate School of Informatics, Kyoto University, Yoshida-honmachi, Sakyo-ku, Kyoto 606-8501, Japan","institution_ids":["https://openalex.org/I22299242"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049614400","display_name":"Kazunori Komatani","orcid":"https://orcid.org/0000-0002-6052-600X"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kazunori Komatani","raw_affiliation_strings":["b Department of Intelligence Science and Technology, Graduate School of Informatics, Kyoto University, Yoshida-honmachi, Sakyo-ku, Kyoto 606-8501, Japan"],"affiliations":[{"raw_affiliation_string":"b Department of Intelligence Science and Technology, Graduate School of Informatics, Kyoto University, Yoshida-honmachi, Sakyo-ku, Kyoto 606-8501, Japan","institution_ids":["https://openalex.org/I22299242"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055922202","display_name":"Tetsuya Ogata","orcid":"https://orcid.org/0000-0001-7015-0379"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tetsuya Ogata","raw_affiliation_strings":["c Department of Intelligence Science and Technology, Graduate School of Informatics, Kyoto University, Yoshida-honmachi, Sakyo-ku, Kyoto 606-8501, Japan"],"affiliations":[{"raw_affiliation_string":"c Department of Intelligence Science and Technology, Graduate School of Informatics, Kyoto University, Yoshida-honmachi, Sakyo-ku, Kyoto 606-8501, Japan","institution_ids":["https://openalex.org/I22299242"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005141184","display_name":"Hiroshi G. Okuno","orcid":"https://orcid.org/0000-0002-8704-4318"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hiroshi G. Okuno","raw_affiliation_strings":["d Department of Intelligence Science and Technology, Graduate School of Informatics, Kyoto University, Yoshida-honmachi, Sakyo-ku, Kyoto 606-8501, Japan"],"affiliations":[{"raw_affiliation_string":"d Department of Intelligence Science and Technology, Graduate School of Informatics, Kyoto University, Yoshida-honmachi, Sakyo-ku, Kyoto 606-8501, Japan","institution_ids":["https://openalex.org/I22299242"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5111821094"],"corresponding_institution_ids":["https://openalex.org/I22299242"],"apc_list":null,"apc_paid":null,"fwci":1.7623,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.83818157,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"23","issue":"6","first_page":"629","last_page":"653"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7124910950660706},{"id":"https://openalex.org/keywords/acoustic-source-localization","display_name":"Acoustic source localization","score":0.6214892864227295},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5349740982055664},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5233694314956665},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5050323605537415},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.4998455047607422},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.48157405853271484},{"id":"https://openalex.org/keywords/maximization","display_name":"Maximization","score":0.4263034164905548},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.40304839611053467},{"id":"https://openalex.org/keywords/sound","display_name":"Sound (geography)","score":0.2200939953327179},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.18514299392700195}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7124910950660706},{"id":"https://openalex.org/C93240960","wikidata":"https://www.wikidata.org/wiki/Q217270","display_name":"Acoustic source localization","level":3,"score":0.6214892864227295},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5349740982055664},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5233694314956665},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5050323605537415},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.4998455047607422},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.48157405853271484},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.4263034164905548},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.40304839611053467},{"id":"https://openalex.org/C203718221","wikidata":"https://www.wikidata.org/wiki/Q491713","display_name":"Sound (geography)","level":2,"score":0.2200939953327179},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.18514299392700195},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1163/156855309x431659","is_oa":false,"landing_page_url":"https://doi.org/10.1163/156855309x431659","pdf_url":null,"source":{"id":"https://openalex.org/S192584203","display_name":"Advanced Robotics","issn_l":"0169-1864","issn":["0169-1864","1568-5535"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advanced Robotics","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320912","display_name":"Ministry of Education, Culture, Sports, Science and Technology","ror":"https://ror.org/048rj2z13"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W1487212816","https://openalex.org/W1673002162","https://openalex.org/W1869758581","https://openalex.org/W1912147533","https://openalex.org/W1985690171","https://openalex.org/W1988790447","https://openalex.org/W2081817329","https://openalex.org/W2113638573","https://openalex.org/W2122796820","https://openalex.org/W2126049200","https://openalex.org/W2147673046","https://openalex.org/W2153458938","https://openalex.org/W2165943878","https://openalex.org/W2168351399","https://openalex.org/W2267719592","https://openalex.org/W4233385860"],"related_works":["https://openalex.org/W2103413230","https://openalex.org/W1899364738","https://openalex.org/W43171467","https://openalex.org/W2908959303","https://openalex.org/W2663901905","https://openalex.org/W2138569648","https://openalex.org/W2143020626","https://openalex.org/W2126942212","https://openalex.org/W2116300362","https://openalex.org/W2018638282"],"abstract_inverted_index":{"We":[0],"have":[1],"developed":[2,118,167],"a":[3,150,163,183,191,207],"human":[4,164],"tracking":[5,185],"system":[6,85,132,196],"for":[7,142,149],"use":[8,68],"by":[9,112,126,161],"robots":[10],"that":[11,120,194],"integrate":[12,173],"sound":[13,29,51,63,90,147],"and":[14,152,176,205],"face":[15],"localization.":[16],"Conventional":[17],"systems":[18],"usually":[19],"require":[20],"many":[21],"microphones":[22,111],"and/or":[23],"prior":[24,69],"information":[25,70,178],"to":[26,60,67,82,133,172,181],"localize":[27,61,198],"several":[28,88],"sources.":[30,91],"Moreover,":[31],"they":[32],"are":[33,98],"incapable":[34],"of":[35,40,50,94,215],"coping":[36],"with":[37,54,87,108,212],"various":[38,137,213],"types":[39,214],"background":[41,216],"noise.":[42,217],"Our":[43],"system,":[44],"the":[45,62,84,101,114,131,143,146,174,202],"cross-power":[46],"spectrum":[47],"phase":[48],"analysis":[49],"signals":[52,156],"obtained":[53],"only":[55,109],"two":[56,110,199],"microphones,":[57],"is":[58,80,105,170],"used":[59,81,171],"source":[64],"without":[65],"having":[66],"such":[71],"as":[72],"impulse":[73],"response":[74],"data.":[75],"An":[76],"expectation-maximization":[77],"(EM)":[78],"algorithm":[79,129],"help":[83],"cope":[86],"moving":[89],"The":[92],"problem":[93],"distinguishing":[95],"whether":[96],"sounds":[97,200],"coming":[99],"from":[100,158],"front":[102],"or":[103],"back":[104],"also":[106,153],"solved":[107],"rotating":[113],"robot's":[115],"head.":[116],"A":[117,166],"method":[119,169],"uses":[121],"facial":[122],"skin":[123],"colors":[124],"classified":[125],"another":[127],"EM":[128],"enables":[130],"detect":[134],"faces":[135],"in":[136,145,179,187],"poses.":[138],"It":[139],"can":[140,197],"compensate":[141],"error":[144],"localization":[148],"speaker":[151],"identify":[154],"noise":[155],"entering":[157],"undesired":[159],"directions":[160],"detecting":[162],"face.":[165],"probability-based":[168],"auditory":[175],"visual":[177],"order":[180],"produce":[182],"reliable":[184],"path":[186],"real-time.":[188],"Experiments":[189],"using":[190],"robot":[192],"showed":[193],"our":[195],"at":[201],"same":[203],"time":[204],"track":[206],"communication":[208],"partner":[209],"while":[210],"dealing":[211]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2017,"cited_by_count":1},{"year":2015,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
