{"id":"https://openalex.org/W2061937230","doi":"https://doi.org/10.1109/icassp.2010.5495131","title":"Improving speech recognition by explicit modeling of phone deletions","display_name":"Improving speech recognition by explicit modeling of phone deletions","publication_year":2010,"publication_date":"2010-01-01","ids":{"openalex":"https://openalex.org/W2061937230","doi":"https://doi.org/10.1109/icassp.2010.5495131","mag":"2061937230"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2010.5495131","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2010.5495131","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038062913","display_name":"Tom Ko","orcid":"https://orcid.org/0000-0002-5324-8961"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Tom Ko","raw_affiliation_strings":["Department of Computer Science and Engineering, Hong Kong University of Science and Technology, Hong Kong, China","Department of Computer Science and Engineering, the Hong Kong University of Science and Technology, Clear Water Bay, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Hong Kong University of Science and Technology, Hong Kong, China","institution_ids":["https://openalex.org/I200769079"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, the Hong Kong University of Science and Technology, Clear Water Bay, Hong Kong","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059141717","display_name":"Brian Mak","orcid":"https://orcid.org/0000-0001-6787-5555"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Brian Mak","raw_affiliation_strings":["Department of Computer Science and Engineering, Hong Kong University of Science and Technology, Hong Kong, China","Department of Computer Science and Engineering, the Hong Kong University of Science and Technology, Clear Water Bay, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Hong Kong University of Science and Technology, Hong Kong, China","institution_ids":["https://openalex.org/I200769079"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, the Hong Kong University of Science and Technology, Clear Water Bay, Hong Kong","institution_ids":["https://openalex.org/I200769079"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5038062913"],"corresponding_institution_ids":["https://openalex.org/I200769079"],"apc_list":null,"apc_paid":null,"fwci":1.3531,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.84413966,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"4858","last_page":"4861"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/phone","display_name":"Phone","score":0.8563967943191528},{"id":"https://openalex.org/keywords/syllable","display_name":"Syllable","score":0.8355507850646973},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.8281505107879639},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.8257691264152527},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.751913845539093},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.6696950197219849},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5922124981880188},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5166983604431152},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4058614671230316},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14729997515678406},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.13036492466926575},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.05806511640548706}],"concepts":[{"id":"https://openalex.org/C2778707766","wikidata":"https://www.wikidata.org/wiki/Q202064","display_name":"Phone","level":2,"score":0.8563967943191528},{"id":"https://openalex.org/C109089402","wikidata":"https://www.wikidata.org/wiki/Q8188","display_name":"Syllable","level":2,"score":0.8355507850646973},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.8281505107879639},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.8257691264152527},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.751913845539093},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.6696950197219849},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5922124981880188},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5166983604431152},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4058614671230316},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14729997515678406},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.13036492466926575},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.05806511640548706},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icassp.2010.5495131","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2010.5495131","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-6561","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-6561","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":null,"raw_type":"Conference paper"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4000000059604645,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W3274920","https://openalex.org/W40804352","https://openalex.org/W83248749","https://openalex.org/W1608231129","https://openalex.org/W2121464381","https://openalex.org/W2141970127","https://openalex.org/W2154478440","https://openalex.org/W2155963197","https://openalex.org/W2158286329","https://openalex.org/W2166637769","https://openalex.org/W2167200294","https://openalex.org/W2167715705","https://openalex.org/W2406143854","https://openalex.org/W2888226713","https://openalex.org/W6682900024","https://openalex.org/W6753776127"],"related_works":["https://openalex.org/W2514064218","https://openalex.org/W2094188777","https://openalex.org/W2112609279","https://openalex.org/W1581825163","https://openalex.org/W1483316057","https://openalex.org/W2061937230","https://openalex.org/W2309273277","https://openalex.org/W2366310385","https://openalex.org/W2399404538","https://openalex.org/W2132658536"],"abstract_inverted_index":{"In":[0,72],"a":[1,34,124],"paper":[2],"published":[3],"by":[4,90],"Greenberg":[5],"in":[6,12,68,119],"1998,":[7],"it":[8],"was":[9,88],"said":[10],"that":[11,110],"conversational":[13],"speech,":[14,121],"phone":[15,65,86,117],"deletion":[16,26,87],"rate":[17,27,127],"may":[18],"go":[19],"as":[20,22],"high":[21],"12%":[23],"whereas":[24],"syllable":[25,39,47],"is":[28],"about":[29],"1%.":[30],"The":[31],"finding":[32],"prompted":[33],"new":[35],"research":[36],"direction":[37],"of":[38,96,116,129],"modeling":[40],"for":[41,93],"speech":[42],"recognition.":[43],"To":[44],"date,":[45],"the":[46,56],"approach":[48],"has":[49],"not":[50],"yet":[51],"fulfilled":[52],"its":[53],"promise.":[54],"On":[55],"other":[57],"hand,":[58],"there":[59],"were":[60,78],"few":[61],"attempts":[62],"to":[63],"model":[64],"deletions":[66,118],"explicitly":[67],"current":[69],"ASR":[70],"systems.":[71],"this":[73,113],"paper,":[74],"fragmented":[75],"word":[76,125],"models":[77],"derived":[79],"from":[80],"well-trained":[81],"cross-word":[82],"triphone":[83],"models,":[84],"and":[85],"implemented":[89],"skip":[91],"arcs":[92],"words":[94],"consisting":[95],"at":[97],"least":[98],"four":[99],"phonemes.":[100],"An":[101],"evaluation":[102],"on":[103],"CSR-II":[104],"WSJ1":[105],"Hub2":[106],"5K":[107],"task":[108],"shows":[109],"even":[111],"with":[112],"limited":[114],"implementation":[115],"read":[120],"we":[122],"obtained":[123],"error":[126],"reduction":[128],"6.73%.":[130]},"counts_by_year":[{"year":2014,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
