{"id":"https://openalex.org/W2101329857","doi":"https://doi.org/10.1109/robot.2006.1641889","title":"Speaker localization among multi-faces in noisy environment by audio-visual integration","display_name":"Speaker localization among multi-faces in noisy environment by audio-visual integration","publication_year":2006,"publication_date":"2006-07-10","ids":{"openalex":"https://openalex.org/W2101329857","doi":"https://doi.org/10.1109/robot.2006.1641889","mag":"2101329857"},"language":"en","primary_location":{"id":"doi:10.1109/robot.2006.1641889","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robot.2006.1641889","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings 2006 IEEE International Conference on Robotics and Automation, 2006. ICRA 2006.","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066483539","display_name":"Hyun-Don Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I58716616","display_name":"Korea Institute of Science and Technology","ror":"https://ror.org/05kzfa883","country_code":"KR","type":"facility","lineage":["https://openalex.org/I27494661","https://openalex.org/I2801339556","https://openalex.org/I2801339556","https://openalex.org/I4210144908","https://openalex.org/I4387152098","https://openalex.org/I4387152098","https://openalex.org/I58716616"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hyun-Don Kim","raw_affiliation_strings":["Intelligent Robotics Research Center, Korea Institute of Science and Technology, Seoul, South Korea","Intelligent Robotics Res. Center, Korea Inst. of Sci. & Technol., Seoul"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Robotics Research Center, Korea Institute of Science and Technology, Seoul, South Korea","institution_ids":["https://openalex.org/I58716616"]},{"raw_affiliation_string":"Intelligent Robotics Res. Center, Korea Inst. of Sci. & Technol., Seoul","institution_ids":["https://openalex.org/I58716616"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052822694","display_name":"JongSuk Choi","orcid":"https://orcid.org/0000-0002-0399-4675"},"institutions":[{"id":"https://openalex.org/I58716616","display_name":"Korea Institute of Science and Technology","ror":"https://ror.org/05kzfa883","country_code":"KR","type":"facility","lineage":["https://openalex.org/I27494661","https://openalex.org/I2801339556","https://openalex.org/I2801339556","https://openalex.org/I4210144908","https://openalex.org/I4387152098","https://openalex.org/I4387152098","https://openalex.org/I58716616"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jong-Suk Choi","raw_affiliation_strings":["Intelligent Robotics Research Center, Korea Institute of Science and Technology, Seoul, South Korea","Intelligent Robotics Res. Center, Korea Inst. of Sci. & Technol., Seoul"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Robotics Research Center, Korea Institute of Science and Technology, Seoul, South Korea","institution_ids":["https://openalex.org/I58716616"]},{"raw_affiliation_string":"Intelligent Robotics Res. Center, Korea Inst. of Sci. & Technol., Seoul","institution_ids":["https://openalex.org/I58716616"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026078832","display_name":"Munsang Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I58716616","display_name":"Korea Institute of Science and Technology","ror":"https://ror.org/05kzfa883","country_code":"KR","type":"facility","lineage":["https://openalex.org/I27494661","https://openalex.org/I2801339556","https://openalex.org/I2801339556","https://openalex.org/I4210144908","https://openalex.org/I4387152098","https://openalex.org/I4387152098","https://openalex.org/I58716616"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Munsang Kim","raw_affiliation_strings":["Intelligent Robotics Research Center, Korea Institute of Science and Technology, Seoul, South Korea","Intelligent Robotics Res. Center, Korea Inst. of Sci. & Technol., Seoul"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Robotics Research Center, Korea Institute of Science and Technology, Seoul, South Korea","institution_ids":["https://openalex.org/I58716616"]},{"raw_affiliation_string":"Intelligent Robotics Res. Center, Korea Inst. of Sci. & Technol., Seoul","institution_ids":["https://openalex.org/I58716616"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.5569,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.92767135,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1305","last_page":"1310"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10326","display_name":"Indoor and Outdoor Localization Technologies","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9865000247955322,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7514173984527588},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.623836874961853},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5956783890724182},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.583700954914093},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.5758703351020813},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.534267008304596},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5160017013549805},{"id":"https://openalex.org/keywords/acoustic-source-localization","display_name":"Acoustic source localization","score":0.46558040380477905},{"id":"https://openalex.org/keywords/audio-visual","display_name":"Audio visual","score":0.4459362030029297},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4322679340839386},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2000117301940918},{"id":"https://openalex.org/keywords/sound","display_name":"Sound (geography)","score":0.17990297079086304}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7514173984527588},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.623836874961853},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5956783890724182},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.583700954914093},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.5758703351020813},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.534267008304596},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5160017013549805},{"id":"https://openalex.org/C93240960","wikidata":"https://www.wikidata.org/wiki/Q217270","display_name":"Acoustic source localization","level":3,"score":0.46558040380477905},{"id":"https://openalex.org/C3017588708","wikidata":"https://www.wikidata.org/wiki/Q758901","display_name":"Audio visual","level":2,"score":0.4459362030029297},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4322679340839386},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2000117301940918},{"id":"https://openalex.org/C203718221","wikidata":"https://www.wikidata.org/wiki/Q491713","display_name":"Sound (geography)","level":2,"score":0.17990297079086304},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C114793014","wikidata":"https://www.wikidata.org/wiki/Q52109","display_name":"Geomorphology","level":1,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/robot.2006.1641889","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robot.2006.1641889","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings 2006 IEEE International Conference on Robotics and Automation, 2006. ICRA 2006.","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4699999988079071,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1659812139","https://openalex.org/W1932412845","https://openalex.org/W2116546045","https://openalex.org/W2117029426","https://openalex.org/W2124535811","https://openalex.org/W2142232938","https://openalex.org/W2147673046","https://openalex.org/W2147871138","https://openalex.org/W2160566140","https://openalex.org/W2165137454","https://openalex.org/W2168351399","https://openalex.org/W2176633010","https://openalex.org/W4246930083","https://openalex.org/W6637186441","https://openalex.org/W6684422997"],"related_works":["https://openalex.org/W2271369634","https://openalex.org/W2350550760","https://openalex.org/W578794879","https://openalex.org/W2625296515","https://openalex.org/W3137890128","https://openalex.org/W1984634519","https://openalex.org/W4245955731","https://openalex.org/W2393726419","https://openalex.org/W2380912101","https://openalex.org/W2801048620"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3,32,76],"not":[4],"only":[5],"developed":[6],"a":[7,23,28,34,52],"reliable":[8],"sound":[9],"localization":[10,50],"system":[11,26,83,102],"including":[12],"VAD":[13],"(voice":[14],"activity":[15],"detection)":[16],"component":[17],"using":[18,27],"three":[19],"microphones":[20],"but":[21],"also":[22],"face":[24],"tracking":[25],"vision":[29,82],"camera.":[30],"Moreover,":[31],"proposed":[33,79],"way":[35],"to":[36,44,55,84,98],"integrate":[37,99],"these":[38],"systems":[39],"in":[40,48],"the":[41,46,49,64,69,78,85],"human-robot":[42],"interaction":[43],"compensate":[45],"errors":[47],"of":[51,71],"speaker":[53],"and":[54,81,95],"reject":[56],"unnecessary":[57],"speech":[58],"or":[59],"noise":[60],"signals":[61],"entering":[62],"from":[63],"undesired":[65],"directions":[66],"effectively.":[67],"For":[68],"purpose":[70],"verifying":[72],"our":[73],"system's":[74],"performances,":[75],"installed":[77],"audition":[80],"prototype":[86],"robot,":[87],"called":[88],"IROBAA":[89],"(Intelligent":[90],"ROBot":[91],"for":[92],"Active":[93],"Audition),":[94],"showed":[96],"how":[97],"an":[100],"audio-visual":[101]},"counts_by_year":[{"year":2012,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
