{"id":"https://openalex.org/W2161224286","doi":"https://doi.org/10.1109/icassp.2008.4518635","title":"Hierarchical spectro-temporal features for robust speech recognition","display_name":"Hierarchical spectro-temporal features for robust speech recognition","publication_year":2008,"publication_date":"2008-03-01","ids":{"openalex":"https://openalex.org/W2161224286","doi":"https://doi.org/10.1109/icassp.2008.4518635","mag":"2161224286"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2008.4518635","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2008.4518635","pdf_url":null,"source":{"id":"https://openalex.org/S4210167542","display_name":"Proceedings of the ... IEEE International Conference on Acoustics, Speech, and Signal Processing","issn_l":"1520-6149","issn":["1520-6149","2379-190X"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016992467","display_name":"Xavier Domont","orcid":null},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technische Universit\u00e4t Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]},{"id":"https://openalex.org/I4210112253","display_name":"Honda (Germany)","ror":"https://ror.org/022c1xk47","country_code":"DE","type":"company","lineage":["https://openalex.org/I1283473643","https://openalex.org/I4210112253"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Xavier Domont","raw_affiliation_strings":["Control Theory and Robotics Laboratory, Technische Universit\u00e4t Darmstadt, Germany","Honda Research Institute Europe GmbH, Offenbach am Main, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Control Theory and Robotics Laboratory, Technische Universit\u00e4t Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]},{"raw_affiliation_string":"Honda Research Institute Europe GmbH, Offenbach am Main, Germany","institution_ids":["https://openalex.org/I4210112253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071842389","display_name":"Martin Heckmann","orcid":"https://orcid.org/0000-0002-1794-1160"},"institutions":[{"id":"https://openalex.org/I4210112253","display_name":"Honda (Germany)","ror":"https://ror.org/022c1xk47","country_code":"DE","type":"company","lineage":["https://openalex.org/I1283473643","https://openalex.org/I4210112253"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Martin Heckmann","raw_affiliation_strings":["Honda Research Institute Europe GmbH, Offenbach am Main, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Honda Research Institute Europe GmbH, Offenbach am Main, Germany","institution_ids":["https://openalex.org/I4210112253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042767682","display_name":"Frank Joublin","orcid":"https://orcid.org/0000-0002-4421-1737"},"institutions":[{"id":"https://openalex.org/I4210112253","display_name":"Honda (Germany)","ror":"https://ror.org/022c1xk47","country_code":"DE","type":"company","lineage":["https://openalex.org/I1283473643","https://openalex.org/I4210112253"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Frank Joublin","raw_affiliation_strings":["Honda Research Institute Europe GmbH, Offenbach am Main, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Honda Research Institute Europe GmbH, Offenbach am Main, Germany","institution_ids":["https://openalex.org/I4210112253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053974584","display_name":"Christian Goerick","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112253","display_name":"Honda (Germany)","ror":"https://ror.org/022c1xk47","country_code":"DE","type":"company","lineage":["https://openalex.org/I1283473643","https://openalex.org/I4210112253"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Christian Goerick","raw_affiliation_strings":["Honda Research Institute Europe GmbH, Offenbach am Main, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Honda Research Institute Europe GmbH, Offenbach am Main, Germany","institution_ids":["https://openalex.org/I4210112253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.175,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.92149758,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"5","issue":null,"first_page":"4417","last_page":"4420"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.8476643562316895},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7859541177749634},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7009491920471191},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.6421986818313599},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6098123788833618},{"id":"https://openalex.org/keywords/formant","display_name":"Formant","score":0.5712226629257202},{"id":"https://openalex.org/keywords/filter-bank","display_name":"Filter bank","score":0.5625567436218262},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5557634830474854},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5377761125564575},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5202276110649109},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.28875043988227844},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.2097935974597931},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.12371951341629028},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07347309589385986}],"concepts":[{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.8476643562316895},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7859541177749634},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7009491920471191},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.6421986818313599},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6098123788833618},{"id":"https://openalex.org/C158215666","wikidata":"https://www.wikidata.org/wiki/Q1414685","display_name":"Formant","level":3,"score":0.5712226629257202},{"id":"https://openalex.org/C100515483","wikidata":"https://www.wikidata.org/wiki/Q3268235","display_name":"Filter bank","level":3,"score":0.5625567436218262},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5557634830474854},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5377761125564575},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5202276110649109},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.28875043988227844},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2097935974597931},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.12371951341629028},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07347309589385986},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C2779581591","wikidata":"https://www.wikidata.org/wiki/Q36244","display_name":"Vowel","level":2,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/icassp.2008.4518635","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2008.4518635","pdf_url":null,"source":{"id":"https://openalex.org/S4210167542","display_name":"Proceedings of the ... IEEE International Conference on Acoustics, Speech, and Signal Processing","issn_l":"1520-6149","issn":["1520-6149","2379-190X"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},{"id":"pmh:oai:aleph.bib-bvb.de:BVB01-020410303","is_oa":false,"landing_page_url":"http://bvbr.bib-bvb.de:8991/F?func=service&amp;doc_library=BVB01&amp;local_base=BVB01&amp;doc_number=020410303&amp;sequence=000001&amp;line_number=0001&amp;func_code=DB_RECORDS&amp;service_type=MEDIA","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:tubiblio.ulb.tu-darmstadt.de:42300","is_oa":false,"landing_page_url":"http://tubiblio.ulb.tu-darmstadt.de/42300/","pdf_url":null,"source":{"id":"https://openalex.org/S4377196390","display_name":"TUbilio (Technical University of Darmstadt)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I31512782","host_organization_name":"Technische Universit\u00e4t Darmstadt","host_organization_lineage":["https://openalex.org/I31512782"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Dissertation"},{"id":"pmh:oai:tubiblio.ulb.tu-darmstadt.de:43807","is_oa":false,"landing_page_url":"http://tubiblio.ulb.tu-darmstadt.de/43807/","pdf_url":null,"source":{"id":"https://openalex.org/S4377196390","display_name":"TUbilio (Technical University of Darmstadt)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I31512782","host_organization_name":"Technische Universit\u00e4t Darmstadt","host_organization_lineage":["https://openalex.org/I31512782"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Konferenzver\u00f6ffentlichung"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":113,"referenced_works":["https://openalex.org/W44505","https://openalex.org/W9692546","https://openalex.org/W82825538","https://openalex.org/W83248749","https://openalex.org/W88081813","https://openalex.org/W96378396","https://openalex.org/W107021117","https://openalex.org/W185597827","https://openalex.org/W190289757","https://openalex.org/W192024671","https://openalex.org/W204776311","https://openalex.org/W396690109","https://openalex.org/W824697508","https://openalex.org/W840994659","https://openalex.org/W1489184006","https://openalex.org/W1490917794","https://openalex.org/W1491238342","https://openalex.org/W1493163583","https://openalex.org/W1506806321","https://openalex.org/W1522045018","https://openalex.org/W1534605895","https://openalex.org/W1534876456","https://openalex.org/W1541452272","https://openalex.org/W1542901287","https://openalex.org/W1563907341","https://openalex.org/W1578856370","https://openalex.org/W1648222827","https://openalex.org/W1663973292","https://openalex.org/W1902027874","https://openalex.org/W1907246751","https://openalex.org/W1926981477","https://openalex.org/W1964223780","https://openalex.org/W1966264494","https://openalex.org/W1974387177","https://openalex.org/W1977690962","https://openalex.org/W1984746632","https://openalex.org/W1987221083","https://openalex.org/W1989348468","https://openalex.org/W1992272902","https://openalex.org/W1993093115","https://openalex.org/W1999940674","https://openalex.org/W2000232298","https://openalex.org/W2000397769","https://openalex.org/W2025653905","https://openalex.org/W2036059453","https://openalex.org/W2037108510","https://openalex.org/W2043567784","https://openalex.org/W2047769394","https://openalex.org/W2050758723","https://openalex.org/W2054139811","https://openalex.org/W2061659108","https://openalex.org/W2066218102","https://openalex.org/W2069976350","https://openalex.org/W2070464324","https://openalex.org/W2071489795","https://openalex.org/W2074354966","https://openalex.org/W2090453668","https://openalex.org/W2090861223","https://openalex.org/W2093283533","https://openalex.org/W2095913425","https://openalex.org/W2096391593","https://openalex.org/W2099741732","https://openalex.org/W2101596234","https://openalex.org/W2102248717","https://openalex.org/W2102512139","https://openalex.org/W2103328846","https://openalex.org/W2104263267","https://openalex.org/W2106156162","https://openalex.org/W2107223151","https://openalex.org/W2110063971","https://openalex.org/W2112638956","https://openalex.org/W2113872551","https://openalex.org/W2118718620","https://openalex.org/W2121137195","https://openalex.org/W2122111406","https://openalex.org/W2122832694","https://openalex.org/W2125838338","https://openalex.org/W2128705673","https://openalex.org/W2129901640","https://openalex.org/W2130426352","https://openalex.org/W2137075158","https://openalex.org/W2137234026","https://openalex.org/W2139737683","https://openalex.org/W2141224535","https://openalex.org/W2144600569","https://openalex.org/W2144636407","https://openalex.org/W2145889472","https://openalex.org/W2146324387","https://openalex.org/W2147119735","https://openalex.org/W2148154194","https://openalex.org/W2149194912","https://openalex.org/W2151484683","https://openalex.org/W2151802380","https://openalex.org/W2152131029","https://openalex.org/W2152483743","https://openalex.org/W2158239695","https://openalex.org/W2158547396","https://openalex.org/W2163680580","https://openalex.org/W2165712214","https://openalex.org/W2166676140","https://openalex.org/W2167200294","https://openalex.org/W2167753501","https://openalex.org/W2266266311","https://openalex.org/W2395865858","https://openalex.org/W2403141126","https://openalex.org/W2541843830","https://openalex.org/W2542469892","https://openalex.org/W2738048707","https://openalex.org/W3143596294","https://openalex.org/W4285719527","https://openalex.org/W6613520308","https://openalex.org/W6677759377","https://openalex.org/W6712026950"],"related_works":["https://openalex.org/W2025848302","https://openalex.org/W1975454382","https://openalex.org/W2799441357","https://openalex.org/W5449343","https://openalex.org/W2409530148","https://openalex.org/W2053642297","https://openalex.org/W4250508028","https://openalex.org/W4403337003","https://openalex.org/W2070513494","https://openalex.org/W2546026986"],"abstract_inverted_index":{"Previously":[0],"we":[1,23,46],"presented":[2],"an":[3],"auditory-inspired":[4],"feed-forward":[5],"architecture":[6],"which":[7,66,86],"achieves":[8],"good":[9],"performance":[10],"in":[11,125],"noisy":[12],"conditions":[13],"on":[14,104],"a":[15,27,52,105],"segmented":[16],"word":[17],"recognition":[18,108,123],"task.":[19,109],"In":[20],"this":[21,31],"paper":[22],"propose":[24],"to":[25,34,61,83],"use":[26],"modified":[28],"version":[29],"of":[30,77],"hierarchical":[32],"model":[33],"generate":[35],"features":[36,45,85,100,120],"for":[37],"standard":[38],"hidden":[39],"Markov":[40],"models.":[41],"To":[42],"obtain":[43],"these":[44],"firstly":[47],"compute":[48],"the":[49,58,63,75,78,88],"spectrograms":[50],"using":[51,70],"Gammatone":[53],"filterbank.":[54],"A":[55],"filtering":[56],"over":[57,94],"channels":[59],"permits":[60],"enhance":[62],"formant":[64],"frequencies":[65],"are":[67,81],"afterwards":[68],"detected":[69],"Gabor-like":[71],"receptive":[72,79],"fields.":[73],"Then":[74],"responses":[76],"fields":[80],"combined":[82],"complex":[84],"span":[87],"whole":[89],"frequency":[90],"range":[91],"and":[92],"extend":[93],"three":[95],"different":[96],"time":[97],"windows.":[98],"The":[99,110],"have":[101],"been":[102],"evaluated":[103],"single":[106],"digit":[107],"results":[111],"show":[112],"that":[113],"their":[114],"combination":[115],"with":[116],"MFCCs":[117],"or":[118],"RASTA":[119],"yields":[121],"improved":[122],"scores":[124],"noise.":[126]},"counts_by_year":[{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":1},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
