{"id":"https://openalex.org/W2504454573","doi":"https://doi.org/10.1109/iros.2016.7759437","title":"Reverberant sound localization with a robot head based on direct-path relative transfer function","display_name":"Reverberant sound localization with a robot head based on direct-path relative transfer function","publication_year":2016,"publication_date":"2016-10-01","ids":{"openalex":"https://openalex.org/W2504454573","doi":"https://doi.org/10.1109/iros.2016.7759437","mag":"2504454573"},"language":"en","primary_location":{"id":"doi:10.1109/iros.2016.7759437","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros.2016.7759437","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2012.03574","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Xiaofei Li","orcid":null},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en sciences et technologies du num\u00e9rique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"government","lineage":["https://openalex.org/I1326498283"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Xiaofei Li","raw_affiliation_strings":["INRIA Grenoble Rhone-Alpes"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"INRIA Grenoble Rhone-Alpes","institution_ids":["https://openalex.org/I1326498283"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Laurent Girin","orcid":null},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en sciences et technologies du num\u00e9rique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"government","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I4210124956","display_name":"GIPSA-Lab","ror":"https://ror.org/02wrme198","country_code":"FR","type":"facility","lineage":["https://openalex.org/I106785703","https://openalex.org/I1294671590","https://openalex.org/I4210124956","https://openalex.org/I899635006","https://openalex.org/I899635006"]},{"id":"https://openalex.org/I899635006","display_name":"Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/02rx3b187","country_code":"FR","type":"education","lineage":["https://openalex.org/I899635006"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Laurent Girin","raw_affiliation_strings":["GIPSA-LAB","INRIA Grenoble Rhone-Alpes","Univ. Grenoble Alpes"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"GIPSA-LAB","institution_ids":["https://openalex.org/I4210124956"]},{"raw_affiliation_string":"INRIA Grenoble Rhone-Alpes","institution_ids":["https://openalex.org/I1326498283"]},{"raw_affiliation_string":"Univ. Grenoble Alpes","institution_ids":["https://openalex.org/I899635006"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Fabien Badeig","orcid":null},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en sciences et technologies du num\u00e9rique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"government","lineage":["https://openalex.org/I1326498283"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Fabien Badeig","raw_affiliation_strings":["INRIA Grenoble Rhone-Alpes"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"INRIA Grenoble Rhone-Alpes","institution_ids":["https://openalex.org/I1326498283"]}]},{"author_position":"last","author":{"id":null,"display_name":"Radu Horaud","orcid":null},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en sciences et technologies du num\u00e9rique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"government","lineage":["https://openalex.org/I1326498283"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Radu Horaud","raw_affiliation_strings":["INRIA Grenoble Rhone-Alpes"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"INRIA Grenoble Rhone-Alpes","institution_ids":["https://openalex.org/I1326498283"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.2763,"has_fulltext":false,"cited_by_count":27,"citation_normalized_percentile":{"value":0.80967458,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2819","last_page":"2826"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10822","display_name":"Acoustic Wave Phenomena Research","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transfer-function","display_name":"Transfer function","score":0.6996999979019165},{"id":"https://openalex.org/keywords/impulse-response","display_name":"Impulse response","score":0.6237000226974487},{"id":"https://openalex.org/keywords/microphone","display_name":"Microphone","score":0.5895000100135803},{"id":"https://openalex.org/keywords/fourier-transform","display_name":"Fourier transform","score":0.5511999726295471},{"id":"https://openalex.org/keywords/microphone-array","display_name":"Microphone array","score":0.421099990606308},{"id":"https://openalex.org/keywords/acoustic-source-localization","display_name":"Acoustic source localization","score":0.41999998688697815},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4050000011920929},{"id":"https://openalex.org/keywords/head-related-transfer-function","display_name":"Head-related transfer function","score":0.40049999952316284},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.3894999921321869},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.3813999891281128}],"concepts":[{"id":"https://openalex.org/C81299745","wikidata":"https://www.wikidata.org/wiki/Q334269","display_name":"Transfer function","level":2,"score":0.6996999979019165},{"id":"https://openalex.org/C72279823","wikidata":"https://www.wikidata.org/wiki/Q1139726","display_name":"Impulse response","level":2,"score":0.6237000226974487},{"id":"https://openalex.org/C2778263558","wikidata":"https://www.wikidata.org/wiki/Q46384","display_name":"Microphone","level":3,"score":0.5895000100135803},{"id":"https://openalex.org/C102519508","wikidata":"https://www.wikidata.org/wiki/Q6520159","display_name":"Fourier transform","level":2,"score":0.5511999726295471},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5220000147819519},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.49639999866485596},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.489300012588501},{"id":"https://openalex.org/C2778806681","wikidata":"https://www.wikidata.org/wiki/Q907293","display_name":"Microphone array","level":4,"score":0.421099990606308},{"id":"https://openalex.org/C93240960","wikidata":"https://www.wikidata.org/wiki/Q217270","display_name":"Acoustic source localization","level":3,"score":0.41999998688697815},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4050000011920929},{"id":"https://openalex.org/C151382886","wikidata":"https://www.wikidata.org/wiki/Q1432854","display_name":"Head-related transfer function","level":3,"score":0.40049999952316284},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.3894999921321869},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.3813999891281128},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.38109999895095825},{"id":"https://openalex.org/C168110828","wikidata":"https://www.wikidata.org/wiki/Q1331626","display_name":"Spectral density","level":2,"score":0.3573000133037567},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.35600000619888306},{"id":"https://openalex.org/C2778067643","wikidata":"https://www.wikidata.org/wiki/Q166507","display_name":"Interval (graph theory)","level":2,"score":0.35510000586509705},{"id":"https://openalex.org/C8590192","wikidata":"https://www.wikidata.org/wiki/Q1054694","display_name":"Frequency response","level":2,"score":0.35179999470710754},{"id":"https://openalex.org/C197055811","wikidata":"https://www.wikidata.org/wiki/Q207522","display_name":"Probability density function","level":2,"score":0.349700003862381},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.33820000290870667},{"id":"https://openalex.org/C70836080","wikidata":"https://www.wikidata.org/wiki/Q837940","display_name":"Impulse (physics)","level":2,"score":0.33640000224113464},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.33000001311302185},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3296000063419342},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.32190001010894775},{"id":"https://openalex.org/C54926389","wikidata":"https://www.wikidata.org/wiki/Q7575188","display_name":"Spectral envelope","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C95851461","wikidata":"https://www.wikidata.org/wiki/Q468809","display_name":"Reverberation","level":2,"score":0.3095000088214874},{"id":"https://openalex.org/C166386157","wikidata":"https://www.wikidata.org/wiki/Q1477735","display_name":"Short-time Fourier transform","level":4,"score":0.29789999127388},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2596000134944916},{"id":"https://openalex.org/C19118579","wikidata":"https://www.wikidata.org/wiki/Q786423","display_name":"Frequency domain","level":2,"score":0.258899986743927},{"id":"https://openalex.org/C100675267","wikidata":"https://www.wikidata.org/wiki/Q1371624","display_name":"Background noise","level":2,"score":0.25459998846054077},{"id":"https://openalex.org/C175231954","wikidata":"https://www.wikidata.org/wiki/Q1942321","display_name":"Optical transfer function","level":2,"score":0.25380000472068787},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.2533999979496002}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iros.2016.7759437","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros.2016.7759437","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2012.03574","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2012.03574","pdf_url":"https://arxiv.org/pdf/2012.03574","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:HAL:hal-01349771v1","is_oa":false,"landing_page_url":"https://inria.hal.science/hal-01349771","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.iros2016.org/","raw_type":"Conference papers"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2012.03574","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2012.03574","pdf_url":"https://arxiv.org/pdf/2012.03574","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W1552633171","https://openalex.org/W1555217905","https://openalex.org/W1608607476","https://openalex.org/W1964998538","https://openalex.org/W1966081805","https://openalex.org/W1981463705","https://openalex.org/W2019231209","https://openalex.org/W2025127228","https://openalex.org/W2050551142","https://openalex.org/W2063521662","https://openalex.org/W2069885239","https://openalex.org/W2084637638","https://openalex.org/W2090024980","https://openalex.org/W2093010905","https://openalex.org/W2115969105","https://openalex.org/W2126341088","https://openalex.org/W2126942983","https://openalex.org/W2128970593","https://openalex.org/W2130357996","https://openalex.org/W2130642871","https://openalex.org/W2131968171","https://openalex.org/W2137666850","https://openalex.org/W2139129402","https://openalex.org/W2147665979","https://openalex.org/W2153248083","https://openalex.org/W2155323221","https://openalex.org/W2156676906","https://openalex.org/W2166682639","https://openalex.org/W2171355909","https://openalex.org/W2204714259","https://openalex.org/W2295648723","https://openalex.org/W6638560928"],"related_works":[],"abstract_inverted_index":{"This":[0],"paper":[1],"addresses":[2],"the":[3,43,51,73,76,83,100,108,115,126,130,134,138,144,150,173,183,194,197,223],"problem":[4],"of":[5,32,50,82,129,137,143,167,178],"sound-source":[6],"localization":[7],"(SSL)":[8],"with":[9,213],"a":[10,15,48,96,165,207,214],"robot":[11],"head,":[12],"which":[13,182],"remains":[14],"challenge":[16],"in":[17,25,107,181,217],"real-world":[18],"environments.":[19],"In":[20,54],"particular":[21],"we":[22],"are":[23,31,159,200],"interested":[24],"locating":[26],"speech":[27,152,174],"sources,":[28],"as":[29,72,206],"they":[30],"high":[33],"interest":[34],"for":[35,92,210],"human-robot":[36],"interaction.":[37],"The":[38,64],"microphone-pair":[39],"response":[40,57,128],"corresponding":[41],"to":[42,98,123],"direct-path":[44,65,77,145],"sound":[45],"propagation":[46],"is":[47,58,70,88,121,140,170,185,190],"function":[49,68,80,118],"source":[52],"direction.":[53],"practice,":[55],"this":[56],"contaminated":[59],"by":[60,161,172,192],"noise":[61],"and":[62,86,104,133,154,176,189,204],"reverberations.":[63],"relative":[66],"transfer":[67,79,117],"(DP-RTF)":[69],"defined":[71],"ratio":[74],"between":[75],"acoustic":[78],"(ATF)":[81],"two":[84,227],"microphones,":[85],"it":[87],"an":[89,186],"important":[90],"feature":[91,208],"SSL.":[93,211],"We":[94],"propose":[95],"method":[97,225],"estimate":[99],"DP-RTF":[101,184],"from":[102],"noisy":[103],"reverberant":[105,219],"signals":[106],"short-time":[109],"Fourier":[110],"transform":[111],"(STFT)":[112],"domain.":[113],"First,":[114],"convolutive":[116],"(CTF)":[119],"approximation":[120],"adopted":[122],"accurately":[124],"represent":[125],"impulse":[127],"microphone":[131],"array,":[132],"first":[135],"coefficient":[136],"CTF":[139],"mainly":[141],"composed":[142],"ATF.":[146],"At":[147],"each":[148],"frequency,":[149],"frame-wise":[151],"auto-":[153,175],"cross-power":[155],"spectral":[156,162],"density":[157],"(PSD)":[158],"obtained":[160],"subtraction.":[163],"Then":[164],"set":[166],"linear":[168],"equations":[169],"constructed":[171],"cross-PSD":[177],"multiple":[179],"frames,":[180],"unknown":[187],"variable,":[188],"estimated":[191,198],"solving":[193],"equations.":[195],"Finally,":[196],"DP-RTFs":[199],"concatenated":[201],"across":[202],"frequencies":[203],"used":[205],"vector":[209],"Experiments":[212],"robot,":[215],"placed":[216],"various":[218],"environments,":[220],"show":[221],"that":[222],"proposed":[224],"outperforms":[226],"state-of-the-art":[228],"methods.":[229]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":4},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2016-08-23T00:00:00"}
