{"id":"https://openalex.org/W2795648103","doi":"https://doi.org/10.1109/devlrn.2017.8329802","title":"Comparative study of feature extraction methods for direct word discovery with NPB-DAA from natural speech signals","display_name":"Comparative study of feature extraction methods for direct word discovery with NPB-DAA from natural speech signals","publication_year":2017,"publication_date":"2017-09-01","ids":{"openalex":"https://openalex.org/W2795648103","doi":"https://doi.org/10.1109/devlrn.2017.8329802","mag":"2795648103"},"language":"en","primary_location":{"id":"doi:10.1109/devlrn.2017.8329802","is_oa":false,"landing_page_url":"https://doi.org/10.1109/devlrn.2017.8329802","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 Joint IEEE International Conference on Development and Learning and Epigenetic Robotics (ICDL-EpiRob)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101016762","display_name":"Yuki Tada","orcid":null},"institutions":[{"id":"https://openalex.org/I135768898","display_name":"Ritsumeikan University","ror":"https://ror.org/0197nmd03","country_code":"JP","type":"education","lineage":["https://openalex.org/I135768898","https://openalex.org/I4390039241"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yuki Tada","raw_affiliation_strings":["Graduate School of Information Science and Engineering, Ritsumeikan University, Kusatsu, Shiga, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Engineering, Ritsumeikan University, Kusatsu, Shiga, Japan","institution_ids":["https://openalex.org/I135768898"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064096346","display_name":"Yoshinobu Hagiwara","orcid":"https://orcid.org/0009-0006-1208-3159"},"institutions":[{"id":"https://openalex.org/I135768898","display_name":"Ritsumeikan University","ror":"https://ror.org/0197nmd03","country_code":"JP","type":"education","lineage":["https://openalex.org/I135768898","https://openalex.org/I4390039241"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yoshinobu Hagiwara","raw_affiliation_strings":["College of Information Science and Engineering, Ritsumeikan University, Kusatsu, Shiga, Japan"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Ritsumeikan University, Kusatsu, Shiga, Japan","institution_ids":["https://openalex.org/I135768898"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023160093","display_name":"Tadahiro Taniguchi","orcid":"https://orcid.org/0000-0002-5682-2076"},"institutions":[{"id":"https://openalex.org/I135768898","display_name":"Ritsumeikan University","ror":"https://ror.org/0197nmd03","country_code":"JP","type":"education","lineage":["https://openalex.org/I135768898","https://openalex.org/I4390039241"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tadahiro Taniguchi","raw_affiliation_strings":["College of Information Science and Engineering, Ritsumeikan University, Kusatsu, Shiga, Japan"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Ritsumeikan University, Kusatsu, Shiga, Japan","institution_ids":["https://openalex.org/I135768898"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101016762"],"corresponding_institution_ids":["https://openalex.org/I135768898"],"apc_list":null,"apc_paid":null,"fwci":0.5851,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.77379794,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"81","issue":null,"first_page":"164","last_page":"171"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10730","display_name":"Language Development and Disorders","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8124308586120605},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6700921654701233},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5926113128662109},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5403104424476624},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.5366117358207703},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.47847980260849},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.47231173515319824},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.460909903049469},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.4118584394454956},{"id":"https://openalex.org/keywords/speech-corpus","display_name":"Speech corpus","score":0.4100109338760376},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3856295049190521},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3225662112236023},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.31746286153793335},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.25823885202407837},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09642493724822998}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8124308586120605},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6700921654701233},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5926113128662109},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5403104424476624},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.5366117358207703},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.47847980260849},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.47231173515319824},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.460909903049469},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.4118584394454956},{"id":"https://openalex.org/C91863865","wikidata":"https://www.wikidata.org/wiki/Q4349497","display_name":"Speech corpus","level":3,"score":0.4100109338760376},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3856295049190521},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3225662112236023},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.31746286153793335},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.25823885202407837},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09642493724822998},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/devlrn.2017.8329802","is_oa":false,"landing_page_url":"https://doi.org/10.1109/devlrn.2017.8329802","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 Joint IEEE International Conference on Development and Learning and Epigenetic Robotics (ICDL-EpiRob)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5699999928474426,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1567832587","https://openalex.org/W1778492285","https://openalex.org/W1922655562","https://openalex.org/W1942713348","https://openalex.org/W1976359794","https://openalex.org/W1980862600","https://openalex.org/W1994396704","https://openalex.org/W2005958977","https://openalex.org/W2033413759","https://openalex.org/W2036254915","https://openalex.org/W2058079053","https://openalex.org/W2067907977","https://openalex.org/W2091150693","https://openalex.org/W2105099419","https://openalex.org/W2107917162","https://openalex.org/W2115867364","https://openalex.org/W2121137195","https://openalex.org/W2126377586","https://openalex.org/W2132991226","https://openalex.org/W2140991203","https://openalex.org/W2142111485","https://openalex.org/W2142390309","https://openalex.org/W2147768505","https://openalex.org/W2193413348","https://openalex.org/W2220867547","https://openalex.org/W2290437651","https://openalex.org/W2335112305","https://openalex.org/W2346964103","https://openalex.org/W2407753819","https://openalex.org/W2508541768","https://openalex.org/W2949115596","https://openalex.org/W3102667484","https://openalex.org/W4234588466","https://openalex.org/W4235169531","https://openalex.org/W4237938692","https://openalex.org/W6634986005","https://openalex.org/W6640777149","https://openalex.org/W6824062597"],"related_works":["https://openalex.org/W4317383455","https://openalex.org/W2548511587","https://openalex.org/W4293232884","https://openalex.org/W2422472940","https://openalex.org/W2019475500","https://openalex.org/W2548162870","https://openalex.org/W2144773493","https://openalex.org/W2082457099","https://openalex.org/W1987021544","https://openalex.org/W2147998355"],"abstract_inverted_index":{"Human":[0],"infants":[1],"can":[2,55,86,200,221,232],"discover":[3,88],"words":[4,38,202],"directly":[5],"from":[6,41,69,93,128,150,205],"unsegmented":[7],"speech":[8,42,94,115,129,152,207],"signals":[9,43,95,116,130,208],"given":[10],"by":[11,61],"their":[12],"mothers":[13],"and":[14,26,39,66,90,167,203,229,240],"other":[15],"people":[16],"without":[17],"any":[18],"explicitly":[19],"labeled":[20],"data.":[21],"Developing":[22],"a":[23,27,52,119,137,163,168,212],"computational":[24],"model":[25],"machine":[28,82],"learning":[29,83],"method":[30,84],"that":[31,54,85,195],"enable":[32],"an":[33,46,80],"artificial":[34],"system":[35],"to":[36,211],"acquire":[37],"phonemes":[40,204],"automatically":[44,87],"is":[45,79,131],"important":[47],"challenge.":[48],"It":[49],"also":[50],"provides":[51,136],"hypothesis":[53],"explain":[56],"the":[57,123,182,224,235,238,241],"dynamic":[58,179],"process":[59],"performed":[60],"infants,":[62],"i.e.,":[63],"word":[64,146,227,245],"discovery":[65,147],"phoneme":[67],"acquisition":[68],"daily":[70],"experiences.":[71],"The":[72,192],"nonparametric":[73],"Bayesian":[74],"double":[75],"articulation":[76],"analyzer":[77],"(NPB-DAA)":[78],"unsupervised":[81],"word-like":[89],"phoneme-like":[91],"units":[92],"directly.":[96],"However,":[97],"its":[98],"performance":[99,225,242],"has":[100],"only":[101],"not":[102],"been":[103],"evaluated":[104],"using":[105],"natural":[106,114,151,206],"spoken":[107],"languages":[108],"including":[109,117],"consonants.":[110],"For":[111],"dealing":[112],"with":[113,148,173],"consonants,":[118],"comparative":[120,138],"study":[121,139],"of":[122,140,158,176,178,188,218,226,244],"methods":[124,143,161],"for":[125,144],"extracting":[126],"features":[127,180,220],"crucially":[132],"important.":[133],"This":[134],"paper":[135],"feature":[141,159],"extraction":[142,160],"direct":[145],"NPB-DAA":[149,197],"signals.":[153],"We":[154],"examined":[155],"six":[156],"types":[157,175],"employing":[162],"mel-frequency":[164],"cepstral":[165],"coefficient":[166],"deep":[169],"sparse":[170],"autoencoder":[171],"(DSAE)":[172],"several":[174],"employment":[177],"on":[181],"TIDIGITS":[183],"corpus,":[184],"which":[185],"contains":[186],"utterances":[187],"connected":[189],"digit":[190],"sequences.":[191],"results":[193],"showed":[194],"1)":[196],"with/without":[198],"DSAE":[199,231],"extract":[201],"containing":[209],"consonants":[210],"certain":[213],"extent,":[214],"2)":[215],"naive":[216],"introduction":[217],"dynamics":[219],"even":[222],"harm":[223],"discovery,":[228],"3)":[230],"consistently":[233],"increase":[234],"correlation":[236],"between":[237],"log-likelihood":[239],"measure":[243],"discovery.":[246]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
