{"id":"https://openalex.org/W2105831132","doi":"https://doi.org/10.1109/iscslp.2010.5684839","title":"Problems of modeling phone deletion in conversational speech for speech recognition","display_name":"Problems of modeling phone deletion in conversational speech for speech recognition","publication_year":2010,"publication_date":"2010-11-01","ids":{"openalex":"https://openalex.org/W2105831132","doi":"https://doi.org/10.1109/iscslp.2010.5684839","mag":"2105831132"},"language":"en","primary_location":{"id":"doi:10.1109/iscslp.2010.5684839","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2010.5684839","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 7th International Symposium on Chinese Spoken Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059141717","display_name":"Brian Mak","orcid":"https://orcid.org/0000-0001-6787-5555"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Brian Mak","raw_affiliation_strings":["Department of Computer Science and Engineering, Hong Kong University of Science and Technology, Hong Kong, China","Department of Computer Science and Engineering, the Hong Kong University of Science and Technology, Clear Water Bay, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Hong Kong University of Science and Technology, Hong Kong, China","institution_ids":["https://openalex.org/I200769079"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, the Hong Kong University of Science and Technology, Clear Water Bay, Hong Kong","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038062913","display_name":"Tom Ko","orcid":"https://orcid.org/0000-0002-5324-8961"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Tom Ko","raw_affiliation_strings":["Department of Computer Science and Engineering, Hong Kong University of Science and Technology, Hong Kong, China","Department of Computer Science and Engineering, the Hong Kong University of Science and Technology, Clear Water Bay, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Hong Kong University of Science and Technology, Hong Kong, China","institution_ids":["https://openalex.org/I200769079"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, the Hong Kong University of Science and Technology, Clear Water Bay, Hong Kong","institution_ids":["https://openalex.org/I200769079"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5059141717"],"corresponding_institution_ids":["https://openalex.org/I200769079"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13292123,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"114","last_page":"118"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9659000039100647,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/phone","display_name":"Phone","score":0.8208001852035522},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7805616855621338},{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.721720814704895},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.714961051940918},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6003361940383911},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5920810103416443},{"id":"https://openalex.org/keywords/surprise","display_name":"Surprise","score":0.5901976227760315},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.5415850281715393},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5032441020011902},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.46191099286079407},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.4389982223510742},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4183777868747711},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3519997000694275},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.31129950284957886},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.1316089928150177},{"id":"https://openalex.org/keywords/communication","display_name":"Communication","score":0.13009405136108398},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.10117915272712708}],"concepts":[{"id":"https://openalex.org/C2778707766","wikidata":"https://www.wikidata.org/wiki/Q202064","display_name":"Phone","level":2,"score":0.8208001852035522},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7805616855621338},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.721720814704895},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.714961051940918},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6003361940383911},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5920810103416443},{"id":"https://openalex.org/C2780343955","wikidata":"https://www.wikidata.org/wiki/Q333173","display_name":"Surprise","level":2,"score":0.5901976227760315},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.5415850281715393},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5032441020011902},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.46191099286079407},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.4389982223510742},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4183777868747711},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3519997000694275},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.31129950284957886},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1316089928150177},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.13009405136108398},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.10117915272712708},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iscslp.2010.5684839","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2010.5684839","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 7th International Symposium on Chinese Spoken Language Processing","raw_type":"proceedings-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-35426","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-35426","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W40804352","https://openalex.org/W943204654","https://openalex.org/W1487082501","https://openalex.org/W1608231129","https://openalex.org/W1631260214","https://openalex.org/W2061937230","https://openalex.org/W2121464381","https://openalex.org/W2141970127","https://openalex.org/W2154478440","https://openalex.org/W2155963197","https://openalex.org/W2166637769","https://openalex.org/W2406143854","https://openalex.org/W6636811518","https://openalex.org/W6678149410","https://openalex.org/W6682900024"],"related_works":["https://openalex.org/W1566315437","https://openalex.org/W2594897229","https://openalex.org/W2151348424","https://openalex.org/W4221142855","https://openalex.org/W2050138804","https://openalex.org/W2129812225","https://openalex.org/W4290708361","https://openalex.org/W2523799048","https://openalex.org/W2155620340","https://openalex.org/W1494910745"],"abstract_inverted_index":{"Recently":[0],"we":[1,70,104],"proposed":[2],"a":[3,45,100],"novel":[4],"method":[5],"to":[6],"explicitly":[7],"model":[8,21],"the":[9,17,26,54,83],"phone":[10,55,76,111],"deletion":[11,56,77,112],"phenomenon":[12,57],"in":[13,34,61,67,78,87,117,121,128],"speech,":[14,36,69,123],"and":[15,63,124],"introduced":[16],"context-dependent":[18],"fragmented":[19],"word":[20,40],"(CD-FWM).":[22],"An":[23],"evaluation":[24],"on":[25,82],"WSJ1":[27],"Hub2":[28],"5K":[29],"task":[30,86],"shows":[31],"that":[32,53],"even":[33],"read":[35,68,118],"CD-FWM":[37,81,130],"could":[38],"reduce":[39],"error":[41],"rate":[42],"(WER)":[43],"by":[44],"relative":[46],"10.3%.":[47],"Since":[48],"it":[49],"is":[50,58,97,114],"generally":[51],"expected":[52],"more":[59,115],"pronounced":[60],"conversational":[62,122,133],"spontaneous":[64],"speech":[65,119],"than":[66,120],"extend":[71],"our":[72,91],"investigation":[73],"of":[74,102],"modeling":[75,113],"conversation":[79],"using":[80],"SVitchboard":[84],"500-word":[85],"this":[88],"paper.":[89],"To":[90],"surprise,":[92],"much":[93],"smaller":[94],"recognition":[95],"gain":[96],"obtained.":[98],"Through":[99],"series":[101],"analyses,":[103],"present":[105],"some":[106],"plausible":[107],"explanations":[108],"for":[109,131],"why":[110],"successful":[116],"suggest":[125],"future":[126],"directions":[127],"improving":[129],"recognizing":[132],"speech.":[134]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
