{"id":"https://openalex.org/W2066674745","doi":"https://doi.org/10.1109/taslp.2013.2292362","title":"A MAP-based Online Estimation Approach to Ensemble Speaker and Speaking Environment Modeling","display_name":"A MAP-based Online Estimation Approach to Ensemble Speaker and Speaking Environment Modeling","publication_year":2014,"publication_date":"2014-01-06","ids":{"openalex":"https://openalex.org/W2066674745","doi":"https://doi.org/10.1109/taslp.2013.2292362","mag":"2066674745"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2013.2292362","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2013.2292362","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044008055","display_name":"Yu Tsao","orcid":"https://orcid.org/0000-0001-6956-0418"},"institutions":[{"id":"https://openalex.org/I4210086894","display_name":"Research Center for Information Technology Innovation, Academia Sinica","ror":"https://ror.org/000zgvm20","country_code":"TW","type":"facility","lineage":["https://openalex.org/I4210086894","https://openalex.org/I84653119"]},{"id":"https://openalex.org/I29955533","display_name":"Center for Information Technology","ror":"https://ror.org/03jh5a977","country_code":"US","type":"facility","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I29955533"]}],"countries":["TW","US"],"is_corresponding":true,"raw_author_name":"Yu Tsao","raw_affiliation_strings":["Research Center for Information Technology Innovation (CITI), Academia Sinica, Taipei, Taiwan","Res. Center for Inf. Technol. Innovation (CITI), Acad. Sinica, Taipei, Taiwan#TAB#"],"affiliations":[{"raw_affiliation_string":"Research Center for Information Technology Innovation (CITI), Academia Sinica, Taipei, Taiwan","institution_ids":["https://openalex.org/I4210086894"]},{"raw_affiliation_string":"Res. Center for Inf. Technol. Innovation (CITI), Acad. Sinica, Taipei, Taiwan#TAB#","institution_ids":["https://openalex.org/I29955533"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077037266","display_name":"Shigeki Matsuda","orcid":null},"institutions":[{"id":"https://openalex.org/I90023481","display_name":"National Institute of Information and Communications Technology","ror":"https://ror.org/016bgq349","country_code":"JP","type":"facility","lineage":["https://openalex.org/I90023481"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shigeki Matsuda","raw_affiliation_strings":["Spoken Language Communication Laboratory, National Institute of Information and Communications Technology (NICT), Kyoto, Japan","Spoken Language Commun. Lab., Nat. Inst. of Inf. & Commun. Technol. (NICT), Kyoto, Japan"],"affiliations":[{"raw_affiliation_string":"Spoken Language Communication Laboratory, National Institute of Information and Communications Technology (NICT), Kyoto, Japan","institution_ids":["https://openalex.org/I90023481"]},{"raw_affiliation_string":"Spoken Language Commun. Lab., Nat. Inst. of Inf. & Commun. Technol. (NICT), Kyoto, Japan","institution_ids":["https://openalex.org/I90023481"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001601327","display_name":"Chiori Hori","orcid":"https://orcid.org/0000-0002-4201-7578"},"institutions":[{"id":"https://openalex.org/I90023481","display_name":"National Institute of Information and Communications Technology","ror":"https://ror.org/016bgq349","country_code":"JP","type":"facility","lineage":["https://openalex.org/I90023481"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Chiori Hori","raw_affiliation_strings":["Spoken Language Communication Laboratory, National Institute of Information and Communications Technology (NICT), Kyoto, Japan","Spoken Language Commun. Lab., Nat. Inst. of Inf. & Commun. Technol. (NICT), Kyoto, Japan"],"affiliations":[{"raw_affiliation_string":"Spoken Language Communication Laboratory, National Institute of Information and Communications Technology (NICT), Kyoto, Japan","institution_ids":["https://openalex.org/I90023481"]},{"raw_affiliation_string":"Spoken Language Commun. Lab., Nat. Inst. of Inf. & Commun. Technol. (NICT), Kyoto, Japan","institution_ids":["https://openalex.org/I90023481"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108760549","display_name":"Hideki Kashioka","orcid":null},"institutions":[{"id":"https://openalex.org/I90023481","display_name":"National Institute of Information and Communications Technology","ror":"https://ror.org/016bgq349","country_code":"JP","type":"facility","lineage":["https://openalex.org/I90023481"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hideki Kashioka","raw_affiliation_strings":["Spoken Language Communication Laboratory, National Institute of Information and Communications Technology (NICT), Kyoto, Japan","Spoken Language Commun. Lab., Nat. Inst. of Inf. & Commun. Technol. (NICT), Kyoto, Japan"],"affiliations":[{"raw_affiliation_string":"Spoken Language Communication Laboratory, National Institute of Information and Communications Technology (NICT), Kyoto, Japan","institution_ids":["https://openalex.org/I90023481"]},{"raw_affiliation_string":"Spoken Language Commun. Lab., Nat. Inst. of Inf. & Commun. Technol. (NICT), Kyoto, Japan","institution_ids":["https://openalex.org/I90023481"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066868860","display_name":"Chin\u2010Hui Lee","orcid":"https://orcid.org/0000-0002-1892-2551"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chin-Hui Lee","raw_affiliation_strings":["School of Electrical and Computer Engineering, Georgia Institute of Technology, GA, USA","Sch. of Electr. & Comput. Eng.,, Georgia Inst. of Technol., Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology, GA, USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"Sch. of Electr. & Comput. Eng.,, Georgia Inst. of Technol., Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5044008055"],"corresponding_institution_ids":["https://openalex.org/I29955533","https://openalex.org/I4210086894"],"apc_list":null,"apc_paid":null,"fwci":2.0451,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.89332458,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"22","issue":"2","first_page":"403","last_page":"416"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/maximum-a-posteriori-estimation","display_name":"Maximum a posteriori estimation","score":0.7922412753105164},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7830531597137451},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.613815188407898},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.4710749685764313},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.46665215492248535},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4410228431224823},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.4232833981513977},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4031365215778351},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35790979862213135},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3206515312194824},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3201172947883606},{"id":"https://openalex.org/keywords/maximum-likelihood","display_name":"Maximum likelihood","score":0.18281584978103638},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09892064332962036},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.09176775813102722}],"concepts":[{"id":"https://openalex.org/C9810830","wikidata":"https://www.wikidata.org/wiki/Q635384","display_name":"Maximum a posteriori estimation","level":3,"score":0.7922412753105164},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7830531597137451},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.613815188407898},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.4710749685764313},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.46665215492248535},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4410228431224823},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4232833981513977},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4031365215778351},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35790979862213135},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3206515312194824},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3201172947883606},{"id":"https://openalex.org/C49781872","wikidata":"https://www.wikidata.org/wiki/Q1045555","display_name":"Maximum likelihood","level":2,"score":0.18281584978103638},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09892064332962036},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.09176775813102722},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2013.2292362","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2013.2292362","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6100000143051147,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":57,"referenced_works":["https://openalex.org/W26894416","https://openalex.org/W31925794","https://openalex.org/W117579468","https://openalex.org/W321662557","https://openalex.org/W1517348348","https://openalex.org/W1578856370","https://openalex.org/W1599512239","https://openalex.org/W2002342963","https://openalex.org/W2010023285","https://openalex.org/W2033565080","https://openalex.org/W2067117291","https://openalex.org/W2069631319","https://openalex.org/W2072009271","https://openalex.org/W2076507042","https://openalex.org/W2080921589","https://openalex.org/W2081976287","https://openalex.org/W2082474452","https://openalex.org/W2084444178","https://openalex.org/W2098692363","https://openalex.org/W2100969003","https://openalex.org/W2103537425","https://openalex.org/W2106885563","https://openalex.org/W2111093880","https://openalex.org/W2111492050","https://openalex.org/W2118329604","https://openalex.org/W2118497033","https://openalex.org/W2124338691","https://openalex.org/W2131118559","https://openalex.org/W2131708681","https://openalex.org/W2135145707","https://openalex.org/W2136386449","https://openalex.org/W2136439176","https://openalex.org/W2138534187","https://openalex.org/W2146423524","https://openalex.org/W2146871184","https://openalex.org/W2147143213","https://openalex.org/W2148694408","https://openalex.org/W2149175990","https://openalex.org/W2150907703","https://openalex.org/W2151484683","https://openalex.org/W2152131029","https://openalex.org/W2155445312","https://openalex.org/W2157178676","https://openalex.org/W2157590573","https://openalex.org/W2158289097","https://openalex.org/W2159112514","https://openalex.org/W2165053039","https://openalex.org/W2165108269","https://openalex.org/W2171892193","https://openalex.org/W2294327763","https://openalex.org/W2294690908","https://openalex.org/W4230946174","https://openalex.org/W4292023222","https://openalex.org/W6630687167","https://openalex.org/W6682194319","https://openalex.org/W6682398751","https://openalex.org/W6697419950"],"related_works":["https://openalex.org/W3201974589","https://openalex.org/W2118095785","https://openalex.org/W2129028194","https://openalex.org/W4226332603","https://openalex.org/W2052691802","https://openalex.org/W2302383703","https://openalex.org/W2390339210","https://openalex.org/W2079742462","https://openalex.org/W2156492252","https://openalex.org/W1500274462"],"abstract_inverted_index":{"An":[0],"ensemble":[1],"speaker":[2],"and":[3,18,131,157,229],"speaking":[4],"environment":[5,26,53,58,107,114,134,226],"modeling":[6,135],"(ESSEM)":[7],"approach":[8],"was":[9],"recently":[10],"developed.":[11],"This":[12],"ESSEM":[13,70,101,130,206,236,251],"process":[14],"consists":[15],"of":[16,36,46,98,129,143,223,259,273],"offline":[17,22],"online":[19,41,95,200,225],"phases.":[20],"The":[21],"phase":[23,42],"establishes":[24],"an":[25,221,253],"structure":[27,108],"using":[28,197,212,220],"speech":[29,74],"data":[30],"collected":[31],"under":[32,77,264],"a":[33,44,87,177,269],"wide":[34],"range":[35],"acoustic":[37,47,63,172],"conditions,":[38,69],"whereas":[39],"the":[40,51,56,61,73,94,99,112,121,126,133,138,149,153,158,182,187,191,198,213,224,233,242,279],"estimates":[43],"set":[45],"models":[48,64],"that":[49,196],"matches":[50],"testing":[52,68,266,282],"based":[54,90,216],"on":[55,186,190],"established":[57],"structure.":[59,115],"Since":[60,163],"estimated":[62],"accurately":[65],"characterize":[66,170],"particular":[67],"can":[71,204],"improve":[72,93],"recognition":[75],"performance":[76,210],"adverse":[78],"conditions.":[79],"In":[80],"this":[81],"work,":[82],"we":[83,117,174,194],"propose":[84,118],"two":[85],"maximum":[86],"posteriori":[88],"(MAP)":[89],"algorithms":[91],"to":[92,110,119,124,169,180,207,240,262,275],"estimation":[96,203],"part":[97],"original":[100,113],"framework.":[102],"We":[103],"first":[104],"develop":[105],"MAP-based":[106,199,235,250],"adaptation":[109,228],"refine":[111],"Next,":[116],"utilize":[120],"MAP":[122,139],"criterion":[123],"estimate":[125],"mapping":[127,201,230],"function":[128,202,231],"enhance":[132],"capability.":[136],"For":[137],"estimation,":[140,232],"three":[141,183,280],"types":[142],"priors":[144],"are":[145,148],"derived;":[146],"they":[147],"clustered":[150],"prior":[151,155,160,165],"(CP),":[152],"sequential":[154],"(SP),":[156],"hierarchical":[159],"(HP)":[161],"densities.":[162],"each":[164],"density":[166],"is":[167,238],"able":[168],"specific":[171],"knowledge,":[173],"further":[175],"derive":[176],"combination":[178],"mechanism":[179],"integrate":[181],"priors.":[184],"Based":[185],"experimental":[188],"results":[189],"Aurora-2":[192],"task,":[193],"verify":[195],"enable":[205],"achieve":[208],"better":[209],"than":[211],"maximum-likelihood":[214],"(ML)":[215],"counterpart.":[217],"Moreover,":[218],"by":[219],"integration":[222],"structuring":[227],"proposed":[234],"framework":[237],"found":[239],"provide":[241],"best":[243],"performance.":[244],"Compared":[245],"with":[246],"our":[247],"baseline":[248],"results,":[249],"achieves":[252],"average":[254],"word":[255],"error":[256],"rate":[257],"reduction":[258],"15.53%":[260],"(5.41":[261],"4.57%)":[263],"50":[265],"conditions":[267],"at":[268],"signal-to-noise":[270],"ratio":[271],"(SNR)":[272],"0":[274],"20":[276],"dB":[277],"over":[278],"standardized":[281],"sets.":[283]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
