{"id":"https://openalex.org/W1988175918","doi":"https://doi.org/10.2478/s13230-010-0005-1","title":"Soft missing-feature mask generation for Robot Audition","display_name":"Soft missing-feature mask generation for Robot Audition","publication_year":2010,"publication_date":"2010-03-01","ids":{"openalex":"https://openalex.org/W1988175918","doi":"https://doi.org/10.2478/s13230-010-0005-1","mag":"1988175918"},"language":"en","primary_location":{"id":"doi:10.2478/s13230-010-0005-1","is_oa":true,"landing_page_url":"https://doi.org/10.2478/s13230-010-0005-1","pdf_url":"https://www.degruyter.com/document/doi/10.2478/s13230-010-0005-1/pdf","source":{"id":"https://openalex.org/S4210226531","display_name":"Paladyn Journal of Behavioral Robotics","issn_l":"2081-4836","issn":["2081-4836"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320322","host_organization_name":"De Gruyter Open","host_organization_lineage":["https://openalex.org/P4310320322","https://openalex.org/P4310313990"],"host_organization_lineage_names":["De Gruyter Open","De Gruyter"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Paladyn, Journal of Behavioral Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.degruyter.com/document/doi/10.2478/s13230-010-0005-1/pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065967819","display_name":"T\u00f4ru Takahashi","orcid":"https://orcid.org/0000-0002-8476-9751"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Toru Takahashi","raw_affiliation_strings":["Department of Intelligence and Science and Technology, Graduate School of Informatics, Kyoto University, Kyoto 606-8501, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Intelligence and Science and Technology, Graduate School of Informatics, Kyoto University, Kyoto 606-8501, Japan","institution_ids":["https://openalex.org/I22299242"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091708408","display_name":"Kazuhiro Nakadai","orcid":"https://orcid.org/0000-0002-6134-4558"},"institutions":[{"id":"https://openalex.org/I1283473643","display_name":"Honda (Japan)","ror":"https://ror.org/03jzay846","country_code":"JP","type":"company","lineage":["https://openalex.org/I1283473643"]},{"id":"https://openalex.org/I114531698","display_name":"Tokyo Institute of Technology","ror":"https://ror.org/0112mx960","country_code":"JP","type":"education","lineage":["https://openalex.org/I114531698"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kazuhiro Nakadai","raw_affiliation_strings":["Honda Research Institute Japan Co., Ltd., 8-1 Honcho, Wako, Saitama 351-0114, Japan","Mechanical and Environmental Informatics, Graduate School of Information Science and Engineering, Tokyo Institute of Technology, Tokyo, 152-8552, Japan"],"affiliations":[{"raw_affiliation_string":"Honda Research Institute Japan Co., Ltd., 8-1 Honcho, Wako, Saitama 351-0114, Japan","institution_ids":["https://openalex.org/I1283473643"]},{"raw_affiliation_string":"Mechanical and Environmental Informatics, Graduate School of Information Science and Engineering, Tokyo Institute of Technology, Tokyo, 152-8552, Japan","institution_ids":["https://openalex.org/I114531698"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049614400","display_name":"Kazunori Komatani","orcid":"https://orcid.org/0000-0002-6052-600X"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kazunori Komatani","raw_affiliation_strings":["Department of Intelligence and Science and Technology, Graduate School of Informatics, Kyoto University, Kyoto 606-8501, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Intelligence and Science and Technology, Graduate School of Informatics, Kyoto University, Kyoto 606-8501, Japan","institution_ids":["https://openalex.org/I22299242"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055922202","display_name":"Tetsuya Ogata","orcid":"https://orcid.org/0000-0001-7015-0379"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tetsuya Ogata","raw_affiliation_strings":["Department of Intelligence and Science and Technology, Graduate School of Informatics, Kyoto University, Kyoto 606-8501, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Intelligence and Science and Technology, Graduate School of Informatics, Kyoto University, Kyoto 606-8501, Japan","institution_ids":["https://openalex.org/I22299242"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005141184","display_name":"Hiroshi G. Okuno","orcid":"https://orcid.org/0000-0002-8704-4318"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hiroshi G. Okuno","raw_affiliation_strings":["Department of Intelligence and Science and Technology, Graduate School of Informatics, Kyoto University, Kyoto 606-8501, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Intelligence and Science and Technology, Graduate School of Informatics, Kyoto University, Kyoto 606-8501, Japan","institution_ids":["https://openalex.org/I22299242"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5065967819"],"corresponding_institution_ids":["https://openalex.org/I22299242"],"apc_list":{"value":1000,"currency":"EUR","value_usd":1078},"apc_paid":{"value":1000,"currency":"EUR","value_usd":1078},"fwci":0.3371,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.53832188,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"1","issue":"1","first_page":"37","last_page":"47"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7458896040916443},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.599671483039856},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5563035607337952},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5464568734169006},{"id":"https://openalex.org/keywords/sigmoid-function","display_name":"Sigmoid function","score":0.4960494935512543},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4671807885169983},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3934501111507416},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.14592254161834717}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7458896040916443},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.599671483039856},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5563035607337952},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5464568734169006},{"id":"https://openalex.org/C81388566","wikidata":"https://www.wikidata.org/wiki/Q526668","display_name":"Sigmoid function","level":3,"score":0.4960494935512543},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4671807885169983},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3934501111507416},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.14592254161834717},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.2478/s13230-010-0005-1","is_oa":true,"landing_page_url":"https://doi.org/10.2478/s13230-010-0005-1","pdf_url":"https://www.degruyter.com/document/doi/10.2478/s13230-010-0005-1/pdf","source":{"id":"https://openalex.org/S4210226531","display_name":"Paladyn Journal of Behavioral Robotics","issn_l":"2081-4836","issn":["2081-4836"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320322","host_organization_name":"De Gruyter Open","host_organization_lineage":["https://openalex.org/P4310320322","https://openalex.org/P4310313990"],"host_organization_lineage_names":["De Gruyter Open","De Gruyter"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Paladyn, Journal of Behavioral Robotics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:fd8c3fada5e24607aae0818fdd454fe9","is_oa":true,"landing_page_url":"https://doaj.org/article/fd8c3fada5e24607aae0818fdd454fe9","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Paladyn, Vol 1, Iss 1, Pp 37-47 (2010)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.2478/s13230-010-0005-1","is_oa":true,"landing_page_url":"https://doi.org/10.2478/s13230-010-0005-1","pdf_url":"https://www.degruyter.com/document/doi/10.2478/s13230-010-0005-1/pdf","source":{"id":"https://openalex.org/S4210226531","display_name":"Paladyn Journal of Behavioral Robotics","issn_l":"2081-4836","issn":["2081-4836"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320322","host_organization_name":"De Gruyter Open","host_organization_lineage":["https://openalex.org/P4310320322","https://openalex.org/P4310313990"],"host_organization_lineage_names":["De Gruyter Open","De Gruyter"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Paladyn, Journal of Behavioral Robotics","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.5600000023841858,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W1988175918.pdf","grobid_xml":"https://content.openalex.org/works/W1988175918.grobid-xml"},"referenced_works_count":42,"referenced_works":["https://openalex.org/W5151113","https://openalex.org/W70999531","https://openalex.org/W75153181","https://openalex.org/W130449084","https://openalex.org/W289804034","https://openalex.org/W1498433797","https://openalex.org/W1552377494","https://openalex.org/W1881865575","https://openalex.org/W1888374534","https://openalex.org/W1994407899","https://openalex.org/W1996255164","https://openalex.org/W2026257980","https://openalex.org/W2031358052","https://openalex.org/W2049737414","https://openalex.org/W2074354966","https://openalex.org/W2075360134","https://openalex.org/W2084533374","https://openalex.org/W2093010905","https://openalex.org/W2100820878","https://openalex.org/W2110460752","https://openalex.org/W2121065047","https://openalex.org/W2121715942","https://openalex.org/W2121973264","https://openalex.org/W2126605958","https://openalex.org/W2126942983","https://openalex.org/W2126969072","https://openalex.org/W2128202590","https://openalex.org/W2134910060","https://openalex.org/W2146083413","https://openalex.org/W2147673046","https://openalex.org/W2148719987","https://openalex.org/W2149527779","https://openalex.org/W2150866759","https://openalex.org/W2160569100","https://openalex.org/W2163235592","https://openalex.org/W2319855873","https://openalex.org/W2397840473","https://openalex.org/W3146426688","https://openalex.org/W3147539069","https://openalex.org/W4301659242","https://openalex.org/W6678139903","https://openalex.org/W6683812780"],"related_works":["https://openalex.org/W4385957115","https://openalex.org/W2061372042","https://openalex.org/W3047779762","https://openalex.org/W1520030019","https://openalex.org/W2071654592","https://openalex.org/W2088157920","https://openalex.org/W2163401555","https://openalex.org/W3104477175","https://openalex.org/W2019022049","https://openalex.org/W4283785902"],"abstract_inverted_index":{"Abstract":[0],"This":[1],"paper":[2],"describes":[3],"an":[4,33,50],"improvement":[5],"in":[6,146],"automatic":[7],"speech":[8],"recognition":[9],"(ASR)":[10],"for":[11,125],"robot":[12,131],"audition":[13,132],"by":[14,171],"introducing":[15],"Missing":[16],"Feature":[17],"Theory":[18],"(MFT)":[19],"based":[20,79,114],"on":[21,80,115],"soft":[22,104,139,173],"missing":[23],"feature":[24],"masks":[25],"(MFM)":[26],"to":[27,53,63,70,93,101,112,168],"realize":[28],"natural":[29],"human-robot":[30,153],"interaction.":[31],"In":[32,151],"everyday":[34],"environment,":[35],"a":[36,98,116,142,152],"robot\u2019s":[37],"microphones":[38],"capture":[39],"various":[40],"sounds":[41],"besides":[42],"the":[43,55,81,89,94,138,156],"user\u2019s":[44,56],"utterances.":[45,150],"Although":[46],"sound-source":[47],"separation":[48],"is":[49,68],"effective":[51],"way":[52],"enhance":[54],"utterances,":[57],"it":[58],"inevitably":[59],"produces":[60],"errors":[61],"due":[62],"reflection":[64],"and":[65],"reverberation.":[66],"MFT":[67],"able":[69],"cope":[71],"with":[72],"these":[73],"errors.":[74],"First,":[75],"MFMs":[76],"are":[77],"generated":[78],"reliability":[82],"of":[83,107],"time-frequency":[84,90],"components.":[85],"Then":[86],"ASR":[87],"weighs":[88],"components":[91],"according":[92],"MFMs.":[95,174],"We":[96],"propose":[97],"new":[99],"method":[100],"automatically":[102],"generate":[103],"MFMs,":[105],"consisting":[106],"continuous":[108],"values":[109],"from":[110,165],"0":[111],"1":[113],"sigmoid":[117],"function.":[118],"The":[119],"proposed":[120],"MFM":[121,140,145],"generation":[122],"was":[123],"implemented":[124],"HRP-2":[126],"using":[127,172],"HARK,":[128],"our":[129],"open-sourced":[130],"software.":[133],"Preliminary":[134],"results":[135],"show":[136],"that":[137],"outperformed":[141],"hard":[143],"(binary)":[144],"recognizing":[147],"three":[148],"simultaneous":[149],"interaction":[154],"task,":[155],"interval":[157],"limitations":[158],"between":[159],"two":[160],"adjacent":[161],"loudspeakers":[162],"were":[163],"reduced":[164],"60":[166],"degrees":[167,170],"30":[169]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2016-06-24T00:00:00"}
