{"id":"https://openalex.org/W2963590452","doi":"https://doi.org/10.21437/interspeech.2018-40","title":"Speech Recognition for Medical Conversations","display_name":"Speech Recognition for Medical Conversations","publication_year":2018,"publication_date":"2018-08-28","ids":{"openalex":"https://openalex.org/W2963590452","doi":"https://doi.org/10.21437/interspeech.2018-40","mag":"2963590452"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2018-40","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2018-40","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2018","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027763497","display_name":"Chung\u2010Cheng Chiu","orcid":"https://orcid.org/0000-0001-9729-4778"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chung-Cheng Chiu","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101403998","display_name":"Anshuman Tripathi","orcid":"https://orcid.org/0000-0002-4902-3719"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Anshuman Tripathi","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070366042","display_name":"Katherine Chou","orcid":"https://orcid.org/0000-0002-0318-7857"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Katherine Chou","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023205465","display_name":"Chris Co","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chris Co","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112445699","display_name":"Navdeep Jaitly","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Navdeep Jaitly","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025389784","display_name":"Diana Jaunzeikare","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Diana Jaunzeikare","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023098355","display_name":"Anjuli Kannan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Anjuli Kannan","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111455517","display_name":"Patrick Nguyen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Patrick Nguyen","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108537573","display_name":"Ha\u015fim Sak","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hasim Sak","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104349809","display_name":"Ananth Sankar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ananth Sankar","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007824431","display_name":"Justin Tansuwan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Justin Tansuwan","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110619222","display_name":"Nathan Wan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nathan Wan","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010253402","display_name":"Yonghui Wu","orcid":"https://orcid.org/0000-0002-6780-6135"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yonghui Wu","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100646177","display_name":"Xuedong Zhang","orcid":"https://orcid.org/0000-0003-2456-2342"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xuedong Zhang","raw_affiliation_strings":["{chungchengc, anshumant, kic, chrisco, ndjaitly,"],"affiliations":[{"raw_affiliation_string":"{chungchengc, anshumant, kic, chrisco, ndjaitly,","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":14,"corresponding_author_ids":["https://openalex.org/A5027763497"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":6.3525,"has_fulltext":false,"cited_by_count":69,"citation_normalized_percentile":{"value":0.97226892,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2972","last_page":"2976"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9812999963760376,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7307261824607849},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6598783135414124},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.37127065658569336}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7307261824607849},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6598783135414124},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.37127065658569336}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2018-40","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2018-40","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2018","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6299999952316284,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W648786980","https://openalex.org/W1855892484","https://openalex.org/W2033256038","https://openalex.org/W2136439176","https://openalex.org/W2140943358","https://openalex.org/W2158069733","https://openalex.org/W2181417294","https://openalex.org/W2296545762","https://openalex.org/W2740281359","https://openalex.org/W2743392628","https://openalex.org/W2902584105","https://openalex.org/W2962765220","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2382290278","https://openalex.org/W2350741829","https://openalex.org/W2130043461","https://openalex.org/W2530322880","https://openalex.org/W1596801655"],"abstract_inverted_index":{"In":[0],"this":[1,21],"paper":[2],"we":[3,23,53,89],"document":[4],"our":[5],"experiences":[6],"with":[7],"developing":[8],"speech":[9],"recognition":[10],"for":[11,91,173],"medical":[12,166,175],"transcription":[13],"-a":[14,32],"system":[15,26],"that":[16,159],"automatically":[17],"transcribes":[18],"doctor-patient":[19],"conversations.Towards":[20],"goal,":[22],"built":[24],"a":[25,41,55,74,86,100,142],"along":[27],"two":[28],"different":[29],"methodological":[30],"lines":[31],"Connectionist":[33],"Temporal":[34],"Classification":[35],"(CTC)":[36],"phoneme":[37],"based":[38,48,112,115],"model":[39,103],"and":[40,44,69,97,125,128,148,168],"Listen":[42],"Attend":[43],"Spell":[45],"(LAS)":[46],"grapheme":[47],"model.To":[49],"train":[50],"these":[51],"models":[52,137,151,161],"used":[54],"corpus":[56],"of":[57,64,66,77,99,109,134,146],"anonymized":[58],"conversations":[59],"representing":[60],"approximately":[61],"14,000":[62],"hours":[63],"speech.Because":[65],"noisy":[67],"transcripts":[68],"alignments":[70],"in":[71,81],"the":[72,93,107,110,132,149],"corpus,":[73],"significant":[75],"amount":[76],"effort":[78],"was":[79,104],"invested":[80],"data":[82,95],"cleaning":[83],"issues.We":[84],"describe":[85],"two-stage":[87],"strategy":[88],"followed":[90],"segmenting":[92],"data.The":[94],"cleanup":[96],"development":[98],"matched":[101],"language":[102,135],"essential":[105],"to":[106,120,123,140,154],"success":[108],"CTC":[111],"models.The":[113],"LAS":[114,150],"models,":[116],"however":[117],"were":[118,138,152],"found":[119],"be":[121,171],"resilient":[122],"alignment":[124],"transcript":[126],"noise":[127],"did":[129],"not":[130],"require":[131],"use":[133],"models.CTC":[136],"able":[139,153],"achieve":[141,155],"word":[143],"error":[144],"rate":[145],"20.1%,":[147],"18.3%.Our":[156],"analysis":[157],"shows":[158],"both":[160],"perform":[162],"well":[163],"on":[164],"important":[165],"utterances":[167],"therefore":[169],"can":[170],"practical":[172],"transcribing":[174],"conversations.":[176]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":8},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":13},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":9},{"year":2018,"cited_by_count":6}],"updated_date":"2026-01-16T23:16:36.188383","created_date":"2025-10-10T00:00:00"}
