{"id":"https://openalex.org/W2143033778","doi":"https://doi.org/10.1109/mmsp.2002.1203296","title":"A speech-centric perspective for human-computer interface","display_name":"A speech-centric perspective for human-computer interface","publication_year":2004,"publication_date":"2004-01-24","ids":{"openalex":"https://openalex.org/W2143033778","doi":"https://doi.org/10.1109/mmsp.2002.1203296","mag":"2143033778"},"language":"en","primary_location":{"id":"doi:10.1109/mmsp.2002.1203296","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mmsp.2002.1203296","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2002 IEEE Workshop on Multimedia Signal Processing.","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100671324","display_name":"Li Deng","orcid":"https://orcid.org/0000-0002-1014-0790"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"L. Deng","raw_affiliation_strings":["Microsoft Research Limited, Redmond, WA, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Limited, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111957484","display_name":"Alex Acero","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"A. Acero","raw_affiliation_strings":["Microsoft Research Limited, Redmond, WA, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Limited, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013069970","display_name":"Yanan Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Y. Wang","raw_affiliation_strings":["Microsoft Research Limited, Redmond, WA, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Limited, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060217537","display_name":"K. Wang","orcid":"https://orcid.org/0009-0002-1480-2373"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"K. Wang","raw_affiliation_strings":["Microsoft Research Limited, Redmond, WA, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Limited, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109215896","display_name":"Hsiao-Wuen Hon","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"H. Hon","raw_affiliation_strings":["Microsoft Research Limited, Redmond, WA, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Limited, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012153296","display_name":"Jasha Droppo","orcid":"https://orcid.org/0000-0001-6097-0090"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"J. Droppo","raw_affiliation_strings":["Microsoft Research Limited, Redmond, WA, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Limited, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113252773","display_name":"M. Mahajan","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"M. Mahajan","raw_affiliation_strings":["Microsoft Research Limited, Redmond, WA, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Limited, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103158343","display_name":"Xuedong Huang","orcid":"https://orcid.org/0000-0003-4550-7908"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"X.D. Huang","raw_affiliation_strings":["Microsoft Research Limited, Redmond, WA, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Limited, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5100671324"],"corresponding_institution_ids":["https://openalex.org/I1290206253"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.1302539,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"3","issue":null,"first_page":"263","last_page":"267"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9427000284194946,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9427000284194946,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7480423450469971},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.6586615443229675},{"id":"https://openalex.org/keywords/interface","display_name":"Interface (matter)","score":0.616443932056427},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.5323180556297302},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3802812397480011},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1832733452320099},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.08717235922813416}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7480423450469971},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.6586615443229675},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.616443932056427},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5323180556297302},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3802812397480011},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1832733452320099},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.08717235922813416},{"id":"https://openalex.org/C157915830","wikidata":"https://www.wikidata.org/wiki/Q2928001","display_name":"Bubble","level":2,"score":0.0},{"id":"https://openalex.org/C129307140","wikidata":"https://www.wikidata.org/wiki/Q6795880","display_name":"Maximum bubble pressure method","level":3,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mmsp.2002.1203296","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mmsp.2002.1203296","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2002 IEEE Workshop on Multimedia Signal Processing.","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.6100000143051147}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W84880661","https://openalex.org/W204852497","https://openalex.org/W1522515958","https://openalex.org/W1950777589","https://openalex.org/W2109831181","https://openalex.org/W2116502454","https://openalex.org/W2151484683","https://openalex.org/W6603374476","https://openalex.org/W6635811418","https://openalex.org/W6676266797"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2149537132","https://openalex.org/W2376932109","https://openalex.org/W2018871932","https://openalex.org/W2001405890","https://openalex.org/W641279757","https://openalex.org/W370975646","https://openalex.org/W2382290278"],"abstract_inverted_index":{"Speech":[0],"technology":[1],"has":[2,19],"been":[3],"playing":[4],"a":[5,106,120,140],"central":[6],"role":[7],"in":[8,29,69,158],"enhancing":[9],"human-machine":[10],"interactions,":[11],"especially":[12],"for":[13,16,25,81],"small":[14],"devices":[15],"which":[17],"GUI":[18],"obvious":[20],"limitations.":[21],"The":[22],"speech-centric":[23,82],"perspective":[24],"human-computer":[26,84],"interface":[27,124],"advanced":[28],"this":[30,59],"paper":[31],"derives":[32],"from":[33,51],"the":[34,39,63,70,76,92,99,144],"view":[35],"that":[36,96,111],"speech":[37,132],"is":[38,105],"only":[40],"natural":[41],"and":[42,52,125,134,138],"expressive":[43],"modality":[44],"to":[45,48,53,114,143],"enable":[46],"people":[47],"access":[49],"information":[50],"interact":[54],"with":[55,150],"any":[56],"device.":[57],"In":[58,86],"paper,":[60],"we":[61,88],"describe":[62],"work":[64],"conducted":[65],"at":[66,75],"Microsoft":[67],"Research,":[68],"project":[71],"codenamed":[72],"Dr.Who,":[73],"aimed":[74],"development":[77],"of":[78,148],"enabling":[79],"technologies":[80],"multimodal":[83,121],"interaction.":[85],"particular,":[87],"present":[89],"MiPad":[90,104],"as":[91],"first":[93],"Dr.Who's":[94],"application":[95],"addresses":[97],"specifically":[98],"mobile":[100,108],"user":[101],"interaction":[102],"scenario.":[103],"wireless":[107],"PDA":[109],"prototype":[110],"enables":[112],"users":[113],"accomplish":[115],"many":[116],"common":[117],"tasks":[118],"using":[119],"spoken":[122,135],"language":[123,136],"wireless-data":[126],"technologies.":[127],"It":[128],"fully":[129],"integrates":[130],"continuous":[131],"recognition":[133],"understanding,":[137],"provides":[139],"novel":[141],"solution":[142],"current":[145],"prevailing":[146],"problem":[147],"pecking":[149],"tiny":[151],"styluses":[152],"or":[153,161],"typing":[154],"on":[155],"minuscule":[156],"keyboards":[157],"today's":[159],"PDAs":[160],"smart":[162],"phones.":[163]},"counts_by_year":[{"year":2015,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
