{"id":"https://openalex.org/W2030348640","doi":"https://doi.org/10.1109/wiamis.2013.6616122","title":"Robust spectro-temporal speech features with model-based distribution equalization","display_name":"Robust spectro-temporal speech features with model-based distribution equalization","publication_year":2013,"publication_date":"2013-07-01","ids":{"openalex":"https://openalex.org/W2030348640","doi":"https://doi.org/10.1109/wiamis.2013.6616122","mag":"2030348640"},"language":"en","primary_location":{"id":"doi:10.1109/wiamis.2013.6616122","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wiamis.2013.6616122","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 14th International Workshop on Image Analysis for Multimedia Interactive Services (WIAMIS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015154305","display_name":"Samuel K. Ngouoko M","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112253","display_name":"Honda (Germany)","ror":"https://ror.org/022c1xk47","country_code":"DE","type":"company","lineage":["https://openalex.org/I1283473643","https://openalex.org/I4210112253"]},{"id":"https://openalex.org/I20121455","display_name":"Bielefeld University","ror":"https://ror.org/02hpadn98","country_code":"DE","type":"education","lineage":["https://openalex.org/I20121455"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Samuel K. Ngouoko M","raw_affiliation_strings":["Honda Research Institute GmbH, Germany","Research Institute for Cognition and Robotics, Bielefeld University, Bielefeld, Germany"],"affiliations":[{"raw_affiliation_string":"Honda Research Institute GmbH, Germany","institution_ids":["https://openalex.org/I4210112253"]},{"raw_affiliation_string":"Research Institute for Cognition and Robotics, Bielefeld University, Bielefeld, Germany","institution_ids":["https://openalex.org/I20121455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071842389","display_name":"Martin Heckmann","orcid":"https://orcid.org/0000-0002-1794-1160"},"institutions":[{"id":"https://openalex.org/I4210112253","display_name":"Honda (Germany)","ror":"https://ror.org/022c1xk47","country_code":"DE","type":"company","lineage":["https://openalex.org/I1283473643","https://openalex.org/I4210112253"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Martin Heckmann","raw_affiliation_strings":["Honda Research Institute GmbH, Germany"],"affiliations":[{"raw_affiliation_string":"Honda Research Institute GmbH, Germany","institution_ids":["https://openalex.org/I4210112253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067961454","display_name":"Britta Wrede","orcid":"https://orcid.org/0000-0003-1424-472X"},"institutions":[{"id":"https://openalex.org/I20121455","display_name":"Bielefeld University","ror":"https://ror.org/02hpadn98","country_code":"DE","type":"education","lineage":["https://openalex.org/I20121455"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Britta Wrede","raw_affiliation_strings":["Research Institute for Cognition and Robotics, Bielefeld University, Bielefeld, Germany"],"affiliations":[{"raw_affiliation_string":"Research Institute for Cognition and Robotics, Bielefeld University, Bielefeld, Germany","institution_ids":["https://openalex.org/I20121455"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5015154305"],"corresponding_institution_ids":["https://openalex.org/I20121455","https://openalex.org/I4210112253"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.08484233,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"5","issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/histogram","display_name":"Histogram","score":0.7153465151786804},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6411711573600769},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6036224365234375},{"id":"https://openalex.org/keywords/equalization","display_name":"Equalization (audio)","score":0.5882030129432678},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5832663774490356},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.5770478248596191},{"id":"https://openalex.org/keywords/histogram-equalization","display_name":"Histogram equalization","score":0.5189828276634216},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4907113313674927},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4876598119735718},{"id":"https://openalex.org/keywords/distribution","display_name":"Distribution (mathematics)","score":0.47918713092803955},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4393157958984375},{"id":"https://openalex.org/keywords/parametric-model","display_name":"Parametric model","score":0.4234023690223694},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4210270643234253},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.26488688588142395},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.25001242756843567},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.13471350073814392},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.07305523753166199},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.07248532772064209}],"concepts":[{"id":"https://openalex.org/C53533937","wikidata":"https://www.wikidata.org/wiki/Q185020","display_name":"Histogram","level":3,"score":0.7153465151786804},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6411711573600769},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6036224365234375},{"id":"https://openalex.org/C75755367","wikidata":"https://www.wikidata.org/wiki/Q104531076","display_name":"Equalization (audio)","level":3,"score":0.5882030129432678},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5832663774490356},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.5770478248596191},{"id":"https://openalex.org/C136943445","wikidata":"https://www.wikidata.org/wiki/Q1970240","display_name":"Histogram equalization","level":4,"score":0.5189828276634216},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4907113313674927},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4876598119735718},{"id":"https://openalex.org/C110121322","wikidata":"https://www.wikidata.org/wiki/Q865811","display_name":"Distribution (mathematics)","level":2,"score":0.47918713092803955},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4393157958984375},{"id":"https://openalex.org/C24574437","wikidata":"https://www.wikidata.org/wiki/Q7135228","display_name":"Parametric model","level":3,"score":0.4234023690223694},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4210270643234253},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.26488688588142395},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.25001242756843567},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.13471350073814392},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.07305523753166199},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.07248532772064209},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/wiamis.2013.6616122","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wiamis.2013.6616122","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 14th International Workshop on Image Analysis for Multimedia Interactive Services (WIAMIS)","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.645.2145","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.645.2145","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://home.arcor.de/martin.heckmann/Publications/2013/Ngouoko-WIAMIS13.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.47999998927116394,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W34609997","https://openalex.org/W88081813","https://openalex.org/W396690109","https://openalex.org/W1970606596","https://openalex.org/W1974387177","https://openalex.org/W1985710418","https://openalex.org/W1990934990","https://openalex.org/W2088489891","https://openalex.org/W2099741732","https://openalex.org/W2118718620","https://openalex.org/W2137075158","https://openalex.org/W2151484683","https://openalex.org/W2152131029","https://openalex.org/W2161224286","https://openalex.org/W2163680580","https://openalex.org/W2166676140","https://openalex.org/W2171000037","https://openalex.org/W2399455627","https://openalex.org/W2574153265","https://openalex.org/W4245289321","https://openalex.org/W6613520308"],"related_works":["https://openalex.org/W2057981026","https://openalex.org/W2256021896","https://openalex.org/W2181573213","https://openalex.org/W2398368608","https://openalex.org/W1990492110","https://openalex.org/W1583737874","https://openalex.org/W2122866860","https://openalex.org/W2024449420","https://openalex.org/W2903465195","https://openalex.org/W2380937280"],"abstract_inverted_index":{"Previously,":[0],"we":[1,32,72,132],"applied":[2],"a":[3,23,51,74,109,165],"distribution":[4,40,53,75,111,156,167],"equalization":[5,76,112,157],"on":[6,78,134,144],"our":[7,88],"HIerarchical":[8],"Spectro-Temporal":[9],"(HIST)":[10],"features":[11,100,106,131,142],"using":[12,117],"distributions":[13],"estimated":[14,80],"from":[15,42,54,160],"histogram":[16,162],"of":[17,63,87,97,103],"one":[18,43,136],"or":[19],"several":[20],"utterances.":[21],"Although":[22],"performance":[24,35,96,139,149],"increase":[25],"could":[26],"be":[27],"observed":[28,66],"in":[29],"both":[30],"cases,":[31],"noticed":[33],"low":[34],"improvement":[36],"when":[37,108],"estimating":[38],"the":[39,60,65,79,95,98,118,127,135,145,151,161],"only":[41],"utterance.":[44],"The":[45],"aim":[46],"here":[47],"is":[48],"to":[49],"determine":[50],"parametric":[52,166],"few":[55],"data":[56,67],"samples":[57],"which":[58],"gives":[59],"highest":[61],"probability":[62],"producing":[64],"considering":[68],"different":[69,122],"models.":[70],"Afterwards,":[71],"perform":[73],"based":[77],"model":[81],"after":[82],"each":[83],"feature":[84,90,153],"extraction":[85,91],"step":[86],"HIST":[89,99,128],"framework.":[92],"We":[93],"compare":[94],"with":[101,155],"those":[102],"conventional":[104],"spectral":[105,141],"(RASTA-PLP),":[107,143],"corresponding":[110],"has":[113],"been":[114],"carried":[115],"out":[116],"TIDigits":[119],"database":[120],"and":[121,129],"noise":[123],"types.":[124],"By":[125],"combining":[126],"RASTA-PLP":[130],"achieved":[133],"hand":[137,147],"better":[138,148],"than":[140,150],"other":[146],"same":[152],"combination":[154],"obtained":[158],"directly":[159],"without":[163],"imposing":[164],"model.":[168]},"counts_by_year":[],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
