{"id":"https://openalex.org/W2085406278","doi":"https://doi.org/10.1109/icassp.2014.6854050","title":"Multi-view learning with supervision for transformed bottleneck features","display_name":"Multi-view learning with supervision for transformed bottleneck features","publication_year":2014,"publication_date":"2014-05-01","ids":{"openalex":"https://openalex.org/W2085406278","doi":"https://doi.org/10.1109/icassp.2014.6854050","mag":"2085406278"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2014.6854050","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2014.6854050","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063457506","display_name":"Raman Arora","orcid":"https://orcid.org/0000-0003-2002-3923"},"institutions":[{"id":"https://openalex.org/I160992636","display_name":"Toyota Technological Institute at Chicago","ror":"https://ror.org/02sn5gb64","country_code":"US","type":"education","lineage":["https://openalex.org/I160992636"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Raman Arora","raw_affiliation_strings":["TTI-Chicago, Chicago, IL","TTI-Chicago, Chicago, IL, USA"],"affiliations":[{"raw_affiliation_string":"TTI-Chicago, Chicago, IL","institution_ids":["https://openalex.org/I160992636"]},{"raw_affiliation_string":"TTI-Chicago, Chicago, IL, USA","institution_ids":["https://openalex.org/I160992636"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015602781","display_name":"Karen Livescu","orcid":"https://orcid.org/0000-0003-4962-946X"},"institutions":[{"id":"https://openalex.org/I160992636","display_name":"Toyota Technological Institute at Chicago","ror":"https://ror.org/02sn5gb64","country_code":"US","type":"education","lineage":["https://openalex.org/I160992636"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Karen Livescu","raw_affiliation_strings":["TTI-Chicago, Chicago, IL","TTI-Chicago, Chicago, IL, USA"],"affiliations":[{"raw_affiliation_string":"TTI-Chicago, Chicago, IL","institution_ids":["https://openalex.org/I160992636"]},{"raw_affiliation_string":"TTI-Chicago, Chicago, IL, USA","institution_ids":["https://openalex.org/I160992636"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5063457506"],"corresponding_institution_ids":["https://openalex.org/I160992636"],"apc_list":null,"apc_paid":null,"fwci":6.1351,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.96437182,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2499","last_page":"2503"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.851164698600769},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7529146075248718},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5606668591499329},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5265660285949707},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.5029630064964294},{"id":"https://openalex.org/keywords/extension","display_name":"Extension (predicate logic)","score":0.47708186507225037},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4553852081298828},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.4241049587726593},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4103415608406067},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.36476343870162964},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.33540019392967224}],"concepts":[{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.851164698600769},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7529146075248718},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5606668591499329},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5265660285949707},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.5029630064964294},{"id":"https://openalex.org/C2778029271","wikidata":"https://www.wikidata.org/wiki/Q5421931","display_name":"Extension (predicate logic)","level":2,"score":0.47708186507225037},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4553852081298828},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.4241049587726593},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4103415608406067},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36476343870162964},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33540019392967224},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2014.6854050","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2014.6854050","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7400000095367432}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W6908809","https://openalex.org/W139227689","https://openalex.org/W1497960466","https://openalex.org/W1523385540","https://openalex.org/W1533861849","https://openalex.org/W1549321558","https://openalex.org/W1589867908","https://openalex.org/W1603575269","https://openalex.org/W1664345024","https://openalex.org/W1975077471","https://openalex.org/W1984983329","https://openalex.org/W1986194954","https://openalex.org/W1995735739","https://openalex.org/W2025341678","https://openalex.org/W2033908685","https://openalex.org/W2042608483","https://openalex.org/W2063036810","https://openalex.org/W2071207147","https://openalex.org/W2080400971","https://openalex.org/W2098817692","https://openalex.org/W2100235303","https://openalex.org/W2152051032","https://openalex.org/W2153890400","https://openalex.org/W2155277636","https://openalex.org/W2159746936","https://openalex.org/W2159948109","https://openalex.org/W2160594205","https://openalex.org/W2165386352","https://openalex.org/W2165712214","https://openalex.org/W2231075402","https://openalex.org/W2296654356","https://openalex.org/W2405732242","https://openalex.org/W2406820985","https://openalex.org/W3087819914","https://openalex.org/W4237723258","https://openalex.org/W4237951138","https://openalex.org/W6600284362","https://openalex.org/W6629823275","https://openalex.org/W6631216910","https://openalex.org/W6631943919","https://openalex.org/W6635242571","https://openalex.org/W6635968555","https://openalex.org/W6713704110","https://openalex.org/W6783563602"],"related_works":["https://openalex.org/W4317548404","https://openalex.org/W3022007134","https://openalex.org/W2130553454","https://openalex.org/W2087783760","https://openalex.org/W2033364610","https://openalex.org/W2797776314","https://openalex.org/W3163689946","https://openalex.org/W2153927146","https://openalex.org/W3104108945","https://openalex.org/W4390190783"],"abstract_inverted_index":{"Previous":[0],"work":[1],"has":[2],"shown":[3],"that":[4,24,113,138],"acoustic":[5,157],"features":[6,81,141],"can":[7,60],"be":[8,61],"improved":[9],"by":[10],"unsupervised":[11],"learning":[12,76,156],"of":[13,78,85,101,111,132],"transformations":[14,77],"based":[15],"on":[16,127],"canonical":[17],"correlation":[18],"analysis":[19],"(CCA)":[20],"using":[21,145],"articulatory":[22,87,119,153],"measurements":[23,88,120,154],"are":[25,46],"available":[26,48],"at":[27,49],"training":[28,50,65,94],"time.":[29,51],"In":[30],"this":[31,36],"paper,":[32],"we":[33],"investigate":[34],"whether":[35],"second":[37],"view":[38],"(articulatory":[39],"data)":[40],"still":[41],"helps":[42],"even":[43],"when":[44,63],"labels":[45,91,117,149],"also":[47],"We":[52,70],"begin":[53],"with":[54],"strong":[55],"baseline":[56],"bottleneck":[57,80],"features,":[58],"which":[59],"learned":[62,140],"the":[64,79,83,93,116,130,139,148,152],"set":[66],"is":[67],"phonetically":[68],"labeled.":[69],"then":[71],"compare":[72],"several":[73],"options":[74],"for":[75,92,155],"in":[82],"presence":[84],"both":[86],"and":[89,103,118],"phonetic":[90],"data.":[95],"The":[96],"methods":[97],"compared":[98],"include":[99],"combinations":[100],"LDA":[102],"CCA,":[104],"as":[105,107,121],"well":[106],"a":[108],"three-view":[109],"extension":[110],"CCA":[112],"simultaneously":[114],"uses":[115],"additional":[122],"views.":[123],"Phonetic":[124],"recognition":[125],"experiments":[126],"data":[128],"from":[129],"University":[131],"Wisconsin":[133],"X-ray":[134],"microbeam":[135],"database":[136],"show":[137],"improve":[142],"performance":[143],"over":[144],"either":[146],"just":[147,151],"or":[150],"transformations.":[158]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":9},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":5},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
