{"id":"https://openalex.org/W2965885792","doi":"https://doi.org/10.1109/o-cocosda46868.2019.9041202","title":"Fast and Accurate Capitalization and Punctuation for Automatic Speech Recognition Using Transformer and Chunk Merging","display_name":"Fast and Accurate Capitalization and Punctuation for Automatic Speech Recognition Using Transformer and Chunk Merging","publication_year":2019,"publication_date":"2019-10-01","ids":{"openalex":"https://openalex.org/W2965885792","doi":"https://doi.org/10.1109/o-cocosda46868.2019.9041202","mag":"2965885792"},"language":"en","primary_location":{"id":"doi:10.1109/o-cocosda46868.2019.9041202","is_oa":false,"landing_page_url":"https://doi.org/10.1109/o-cocosda46868.2019.9041202","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 22nd Conference of the Oriental COCOSDA International Committee for the Co-ordination and Standardisation of Speech Databases and Assessment Techniques (O-COCOSDA)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1908.02404","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091142923","display_name":"Binh P. Nguyen","orcid":"https://orcid.org/0000-0001-6203-6664"},"institutions":[{"id":"https://openalex.org/I94518387","display_name":"Hanoi University of Science and Technology","ror":"https://ror.org/04nyv3z04","country_code":"VN","type":"education","lineage":["https://openalex.org/I94518387"]}],"countries":["VN"],"is_corresponding":true,"raw_author_name":"Binh Nguyen","raw_affiliation_strings":["Hanoi University of Science and Technology,Vietnam","Hanoi University of Science and Technology, Vietnam#TAB#"],"affiliations":[{"raw_affiliation_string":"Hanoi University of Science and Technology,Vietnam","institution_ids":["https://openalex.org/I94518387"]},{"raw_affiliation_string":"Hanoi University of Science and Technology, Vietnam#TAB#","institution_ids":["https://openalex.org/I94518387"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040635512","display_name":"Vu Bao Hung Nguyen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vu Bao Hung Nguyen","raw_affiliation_strings":["Vietnam Artificial Intelligence System,Vietnam"],"affiliations":[{"raw_affiliation_string":"Vietnam Artificial Intelligence System,Vietnam","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048931285","display_name":"Hien D. Nguyen","orcid":"https://orcid.org/0000-0002-8527-0602"},"institutions":[{"id":"https://openalex.org/I4210115718","display_name":"Thai Nguyen University","ror":"https://ror.org/02128gy91","country_code":"VN","type":"education","lineage":["https://openalex.org/I4210115718"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Hien Nguyen","raw_affiliation_strings":["Thai Nguyen University,Vietnam"],"affiliations":[{"raw_affiliation_string":"Thai Nguyen University,Vietnam","institution_ids":["https://openalex.org/I4210115718"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067573637","display_name":"Pham Ngoc Phuong","orcid":"https://orcid.org/0000-0002-7741-3570"},"institutions":[{"id":"https://openalex.org/I4210115718","display_name":"Thai Nguyen University","ror":"https://ror.org/02128gy91","country_code":"VN","type":"education","lineage":["https://openalex.org/I4210115718"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Pham Ngoc Phuong","raw_affiliation_strings":["Thai Nguyen University,Vietnam"],"affiliations":[{"raw_affiliation_string":"Thai Nguyen University,Vietnam","institution_ids":["https://openalex.org/I4210115718"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005800339","display_name":"The-Loc Nguyen","orcid":null},"institutions":[{"id":"https://openalex.org/I29199639","display_name":"Hanoi University of Mining and Geology","ror":"https://ror.org/01rw3qm79","country_code":"VN","type":"education","lineage":["https://openalex.org/I29199639"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"The-Loc Nguyen","raw_affiliation_strings":["Hanoi University, of Mining and Geology,Vietnam","[Hanoi University of Mining and Geology, Vietnam]"],"affiliations":[{"raw_affiliation_string":"Hanoi University, of Mining and Geology,Vietnam","institution_ids":["https://openalex.org/I29199639"]},{"raw_affiliation_string":"[Hanoi University of Mining and Geology, Vietnam]","institution_ids":["https://openalex.org/I29199639"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102847246","display_name":"Quoc Truong","orcid":"https://orcid.org/0000-0003-1472-1370"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Quoc Truong Do","raw_affiliation_strings":["Vietnam Artificial Intelligence System,Vietnam"],"affiliations":[{"raw_affiliation_string":"Vietnam Artificial Intelligence System,Vietnam","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110641459","display_name":"L\u01b0\u01a1ng Chi","orcid":null},"institutions":[{"id":"https://openalex.org/I94518387","display_name":"Hanoi University of Science and Technology","ror":"https://ror.org/04nyv3z04","country_code":"VN","type":"education","lineage":["https://openalex.org/I94518387"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Luong Chi Mai","raw_affiliation_strings":["University of Science and Technology of Hanoi,Vietnam","University of Science and Technology of Hanoi, Vietnam"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of Hanoi,Vietnam","institution_ids":["https://openalex.org/I94518387"]},{"raw_affiliation_string":"University of Science and Technology of Hanoi, Vietnam","institution_ids":["https://openalex.org/I94518387"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5091142923"],"corresponding_institution_ids":["https://openalex.org/I94518387"],"apc_list":null,"apc_paid":null,"fwci":1.5913,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.87820869,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/punctuation","display_name":"Punctuation","score":0.9423883557319641},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7984525561332703},{"id":"https://openalex.org/keywords/capitalization","display_name":"Capitalization","score":0.7354972958564758},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6665471792221069},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6233204007148743},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.6228330731391907},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.5950640439987183},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5592105984687805},{"id":"https://openalex.org/keywords/transcription","display_name":"Transcription (linguistics)","score":0.5546402931213379},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5053043961524963},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4251987040042877},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.14960765838623047},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.089138925075531},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.06600543856620789}],"concepts":[{"id":"https://openalex.org/C540372491","wikidata":"https://www.wikidata.org/wiki/Q82622","display_name":"Punctuation","level":2,"score":0.9423883557319641},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7984525561332703},{"id":"https://openalex.org/C2779137862","wikidata":"https://www.wikidata.org/wiki/Q425951","display_name":"Capitalization","level":2,"score":0.7354972958564758},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6665471792221069},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6233204007148743},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.6228330731391907},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.5950640439987183},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5592105984687805},{"id":"https://openalex.org/C179926584","wikidata":"https://www.wikidata.org/wiki/Q207714","display_name":"Transcription (linguistics)","level":2,"score":0.5546402931213379},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5053043961524963},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4251987040042877},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.14960765838623047},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.089138925075531},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.06600543856620789},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/o-cocosda46868.2019.9041202","is_oa":false,"landing_page_url":"https://doi.org/10.1109/o-cocosda46868.2019.9041202","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 22nd Conference of the Oriental COCOSDA International Committee for the Co-ordination and Standardisation of Speech Databases and Assessment Techniques (O-COCOSDA)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1908.02404","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1908.02404","pdf_url":"https://arxiv.org/pdf/1908.02404","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2965885792","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1908.02404","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1908.02404","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1908.02404","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1908.02404","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1908.02404","pdf_url":"https://arxiv.org/pdf/1908.02404","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6100000143051147}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2965885792.pdf","grobid_xml":"https://content.openalex.org/works/W2965885792.grobid-xml"},"referenced_works_count":26,"referenced_works":["https://openalex.org/W886998232","https://openalex.org/W2130942839","https://openalex.org/W2133564696","https://openalex.org/W2143017621","https://openalex.org/W2147880316","https://openalex.org/W2166116787","https://openalex.org/W2398104528","https://openalex.org/W2403334028","https://openalex.org/W2407834842","https://openalex.org/W2553303224","https://openalex.org/W2745785989","https://openalex.org/W2857028992","https://openalex.org/W2962989741","https://openalex.org/W2963212250","https://openalex.org/W2963403868","https://openalex.org/W2963418779","https://openalex.org/W6624114792","https://openalex.org/W6679436768","https://openalex.org/W6684662674","https://openalex.org/W6712411474","https://openalex.org/W6713441181","https://openalex.org/W6714054690","https://openalex.org/W6729956949","https://openalex.org/W6739901393","https://openalex.org/W6749669830","https://openalex.org/W6752909555"],"related_works":["https://openalex.org/W3011222885","https://openalex.org/W2513522215","https://openalex.org/W2993229155","https://openalex.org/W2398104528","https://openalex.org/W2166116787","https://openalex.org/W2963403868","https://openalex.org/W2938722449","https://openalex.org/W2406343628","https://openalex.org/W2403334028","https://openalex.org/W1587490638","https://openalex.org/W3138583354","https://openalex.org/W3045571807","https://openalex.org/W2545909488","https://openalex.org/W2781510043","https://openalex.org/W3108216882","https://openalex.org/W2057169877","https://openalex.org/W606542161","https://openalex.org/W3082144843","https://openalex.org/W2626964143","https://openalex.org/W3105804405"],"abstract_inverted_index":{"In":[0,67],"recent":[1],"years,":[2],"studies":[3],"on":[4,17,88,123],"automatic":[5],"speech":[6,19],"recognition":[7],"(ASR)":[8],"have":[9],"shown":[10],"outstanding":[11],"results":[12],"that":[13,94,103,128],"reach":[14],"human":[15],"parity":[16],"short":[18],"segments.":[20],"However,":[21],"there":[22],"are":[23],"still":[24],"difficulties":[25,54],"in":[26,108,115,135],"standardizing":[27],"the":[28,47,76,119,129],"output":[29,49],"of":[30],"ASR":[31,48,82],"such":[32,60],"as":[33,61],"capitalization":[34,79,107],"and":[35,51,64,78,91,106,111,138],"punctuation":[36,77,105],"restoration":[37],"for":[38,55,80],"long-speech":[39,81],"transcription.":[40,83],"The":[41,84],"problems":[42],"obstruct":[43],"readers":[44],"to":[45,74,97],"understand":[46],"semantically":[50],"also":[52],"cause":[53],"natural":[56],"language":[57],"processing":[58],"models":[59,90],"NER,":[62],"POS":[63],"semantic":[65],"parsing.":[66],"this":[68],"paper,":[69],"we":[70],"propose":[71],"a":[72,100],"method":[73,85],"restore":[75],"is":[86],"based":[87],"Transformer":[89],"chunk":[92],"merging":[93],"allows":[95],"us":[96],"(1),":[98],"build":[99],"single":[101],"model":[102],"performs":[104],"one":[109],"go,":[110],"(2),":[112],"perform":[113],"decoding":[114,139],"parallel":[116],"while":[117],"improving":[118],"prediction":[120],"accuracy.":[121],"Experiments":[122],"British":[124],"National":[125],"Corpus":[126],"showed":[127],"proposed":[130],"approach":[131],"outperforms":[132],"existing":[133],"methods":[134],"both":[136],"accuracy":[137],"speed.":[140]},"counts_by_year":[{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":7}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
