{"id":"https://openalex.org/W4391742860","doi":"https://doi.org/10.1109/imcom60618.2024.10418445","title":"Efficient Ensemble for Multimodal Punctuation Restoration using Time-Delay Neural Network","display_name":"Efficient Ensemble for Multimodal Punctuation Restoration using Time-Delay Neural Network","publication_year":2024,"publication_date":"2024-01-03","ids":{"openalex":"https://openalex.org/W4391742860","doi":"https://doi.org/10.1109/imcom60618.2024.10418445"},"language":"en","primary_location":{"id":"doi:10.1109/imcom60618.2024.10418445","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/imcom60618.2024.10418445","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 18th International Conference on Ubiquitous Information Management and Communication (IMCOM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5115599670","display_name":"Xing Yi Liu","orcid":"https://orcid.org/0009-0005-3201-5412"},"institutions":[{"id":"https://openalex.org/I78577930","display_name":"Columbia University","ror":"https://ror.org/00hj8s172","country_code":"US","type":"education","lineage":["https://openalex.org/I78577930"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xing Yi Liu","raw_affiliation_strings":["Columbia University,Department of Computer Science,New York,USA","Department of Computer Science, Columbia University, New York, USA"],"affiliations":[{"raw_affiliation_string":"Columbia University,Department of Computer Science,New York,USA","institution_ids":["https://openalex.org/I78577930"]},{"raw_affiliation_string":"Department of Computer Science, Columbia University, New York, USA","institution_ids":["https://openalex.org/I78577930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030917082","display_name":"Homayoon Beigi","orcid":"https://orcid.org/0000-0003-0127-2385"},"institutions":[{"id":"https://openalex.org/I4210160724","display_name":"Access Technologies","ror":"https://ror.org/05kt92j68","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210160724"]},{"id":"https://openalex.org/I78577930","display_name":"Columbia University","ror":"https://ror.org/00hj8s172","country_code":"US","type":"education","lineage":["https://openalex.org/I78577930"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Homayoon Beigi","raw_affiliation_strings":["Columbia University,Department of Computer Science,New York,USA","Recognition Technologies, Inc., South Salem, USA","Department of Computer Science, Columbia University, New York, USA"],"affiliations":[{"raw_affiliation_string":"Columbia University,Department of Computer Science,New York,USA","institution_ids":["https://openalex.org/I78577930"]},{"raw_affiliation_string":"Recognition Technologies, Inc., South Salem, USA","institution_ids":["https://openalex.org/I4210160724"]},{"raw_affiliation_string":"Department of Computer Science, Columbia University, New York, USA","institution_ids":["https://openalex.org/I78577930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5115599670"],"corresponding_institution_ids":["https://openalex.org/I78577930"],"apc_list":null,"apc_paid":null,"fwci":0.3651,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.6117538,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"13","issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13018","display_name":"Seismology and Earthquake Studies","score":0.8805000185966492,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13018","display_name":"Seismology and Earthquake Studies","score":0.8805000185966492,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.8680999875068665,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/punctuation","display_name":"Punctuation","score":0.8035008907318115},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.692188024520874},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5653756260871887},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.4449295699596405},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3859759271144867}],"concepts":[{"id":"https://openalex.org/C540372491","wikidata":"https://www.wikidata.org/wiki/Q82622","display_name":"Punctuation","level":2,"score":0.8035008907318115},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.692188024520874},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5653756260871887},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.4449295699596405},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3859759271144867}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/imcom60618.2024.10418445","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/imcom60618.2024.10418445","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 18th International Conference on Ubiquitous Information Management and Communication (IMCOM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6299999952316284,"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W102958777","https://openalex.org/W1554540371","https://openalex.org/W2105482032","https://openalex.org/W2117671523","https://openalex.org/W2169187092","https://openalex.org/W2398104528","https://openalex.org/W2403334028","https://openalex.org/W2513522215","https://openalex.org/W2586117383","https://openalex.org/W2705373224","https://openalex.org/W2741483887","https://openalex.org/W2799473636","https://openalex.org/W2888942278","https://openalex.org/W2937326859","https://openalex.org/W2938722449","https://openalex.org/W2973072704","https://openalex.org/W3036601975","https://openalex.org/W3037101098","https://openalex.org/W3092085609","https://openalex.org/W3094965760","https://openalex.org/W3095073040","https://openalex.org/W3101648800","https://openalex.org/W3106905592","https://openalex.org/W3185113268","https://openalex.org/W4221166827","https://openalex.org/W4281384017","https://openalex.org/W4296068804","https://openalex.org/W4302327898","https://openalex.org/W4318472777","https://openalex.org/W4372260226","https://openalex.org/W4385822993","https://openalex.org/W6631362777","https://openalex.org/W6635223454","https://openalex.org/W6684662674","https://openalex.org/W6755207826","https://openalex.org/W6780218876"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2936002343","https://openalex.org/W2188883480","https://openalex.org/W1592364192","https://openalex.org/W656840002","https://openalex.org/W1605117403","https://openalex.org/W2381416480","https://openalex.org/W2380599343","https://openalex.org/W2181793145","https://openalex.org/W3163320880"],"abstract_inverted_index":{"Punctuation":[0],"restoration":[1],"plays":[2],"an":[3,30,113],"essential":[4],"role":[5],"in":[6],"the":[7,41,92,110,124],"post-processing":[8],"procedure":[9],"of":[10,54,109],"automatic":[11],"speech":[12,62],"recognition,":[13],"but":[14],"model":[15,44],"efficiency":[16,100],"is":[17,130],"a":[18,34,52,61,106],"key":[19],"requirement":[20],"for":[21,71,94],"this":[22],"task.":[23],"To":[24],"that":[25,39,115],"end,":[26],"we":[27,90],"present":[28],"EfficientPunct,":[29],"ensemble":[31,114],"method":[32],"with":[33,112],"multimodal":[35,125],"time-delay":[36],"neural":[37],"network":[38,57],"outperforms":[40],"current":[42],"best":[43],"by":[45],"1.0":[46],"F1":[47],"points,":[48],"using":[49,84],"less":[50],"than":[51,123],"tenth":[53],"its":[55],"inference":[56],"parameters.":[58],"We":[59],"streamline":[60],"recognizer":[63],"to":[64,78],"efficiently":[65],"output":[66],"hidden":[67],"layer":[68],"acoustic":[69],"embeddings":[70],"punctuation":[72],"restoration,":[73],"as":[74,76],"well":[75],"BERT":[77],"extract":[79],"meaningful":[80],"text":[81],"embeddings.":[82],"By":[83],"forced":[85],"alignment":[86],"and":[87,101],"temporal":[88],"convolutions,":[89],"eliminate":[91],"need":[93],"attention-based":[95],"fusion,":[96],"greatly":[97],"increasing":[98],"computational":[99],"raising":[102],"performance.":[103],"EfficientPunct":[104],"sets":[105],"new":[107],"state":[108],"art":[111],"weights":[116],"BERT's":[117],"purely":[118],"language-based":[119],"predictions":[120],"slightly":[121],"more":[122],"network's":[126],"predictions.":[127],"Our":[128],"code":[129],"available":[131],"at":[132],"https://github.com/lxy-peter/EfficientPunct.":[133]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-25T23:11:45.687758","created_date":"2024-02-13T00:00:00"}
