{"id":"https://openalex.org/W4386794887","doi":"https://doi.org/10.48550/arxiv.2309.07677","title":"Aligning Speakers: Evaluating and Visualizing Text-based Diarization Using Efficient Multiple Sequence Alignment (Extended Version)","display_name":"Aligning Speakers: Evaluating and Visualizing Text-based Diarization Using Efficient Multiple Sequence Alignment (Extended Version)","publication_year":2023,"publication_date":"2023-09-14","ids":{"openalex":"https://openalex.org/W4386794887","doi":"https://doi.org/10.48550/arxiv.2309.07677"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2309.07677","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.07677","pdf_url":"https://arxiv.org/pdf/2309.07677","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2309.07677","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100389824","display_name":"Chen Gong","orcid":"https://orcid.org/0000-0001-9305-6908"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Gong, Chen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5105068598","display_name":"Peilin Wu","orcid":"https://orcid.org/0009-0008-9225-787X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Peilin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101829031","display_name":"Jinho D. Choi","orcid":"https://orcid.org/0000-0003-2693-6934"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choi, Jinho D.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100389824"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8181993365287781},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.7139431238174438},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5519425868988037},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.5187347531318665},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.5137094259262085},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.43886786699295044},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.43768972158432007},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4212465286254883},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4133821129798889},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.11921137571334839}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8181993365287781},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.7139431238174438},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5519425868988037},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.5187347531318665},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.5137094259262085},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.43886786699295044},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43768972158432007},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4212465286254883},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4133821129798889},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.11921137571334839},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2309.07677","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.07677","pdf_url":"https://arxiv.org/pdf/2309.07677","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2309.07677","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2309.07677","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2309.07677","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.07677","pdf_url":"https://arxiv.org/pdf/2309.07677","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.6899999976158142}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4386794887.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2529301793","https://openalex.org/W1556857061","https://openalex.org/W2177420620","https://openalex.org/W4296594783","https://openalex.org/W4387225169","https://openalex.org/W4380994539","https://openalex.org/W4308671730","https://openalex.org/W2944691285","https://openalex.org/W2915347927","https://openalex.org/W3151768066"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,69,78],"novel":[4],"evaluation":[5],"approach":[6],"to":[7,62,67,96],"text-based":[8],"speaker":[9],"diarization":[10],"(SD),":[11],"tackling":[12],"the":[13,90,97,130,136],"limitations":[14],"of":[15,59,132,138],"traditional":[16],"metrics":[17,30,55],"that":[18,85],"do":[19],"not":[20],"account":[21],"for":[22,113,119],"any":[23],"contextual":[24],"information":[25],"in":[26,49,73,89,129],"text.":[27],"Two":[28],"new":[29],"are":[31],"proposed,":[32],"Text-based":[33],"Diarization":[34,38],"Error":[35],"Rate":[36],"and":[37,43,51,117,121],"F1,":[39],"which":[40,125],"perform":[41],"utterance-":[42],"word-level":[44],"evaluations":[45],"by":[46],"aligning":[47],"tokens":[48],"reference":[50,91],"hypothesis":[52,98],"transcripts.":[53],"Our":[54,102],"encompass":[56],"more":[57,70],"types":[58],"errors":[60],"compared":[61],"existing":[63],"ones,":[64],"allowing":[65],"us":[66],"make":[68],"comprehensive":[71],"analysis":[72],"SD.":[74],"To":[75],"align":[76],"tokens,":[77],"multiple":[79,87],"sequence":[80],"alignment":[81,95,115],"algorithm":[82,116],"is":[83,104],"introduced":[84],"supports":[86],"sequences":[88],"while":[92],"handling":[93],"high-dimensional":[94],"using":[99],"dynamic":[100],"programming.":[101],"work":[103],"packaged":[105],"into":[106],"two":[107],"tools,":[108],"align4d":[109],"providing":[110],"an":[111],"API":[112],"our":[114],"TranscribeView":[118],"visualizing":[120],"evaluating":[122],"SD":[123],"errors,":[124],"can":[126],"greatly":[127],"aid":[128],"creation":[131],"high-quality":[133],"data,":[134],"fostering":[135],"advancement":[137],"dialogue":[139],"systems.":[140]},"counts_by_year":[{"year":2023,"cited_by_count":1}],"updated_date":"2026-03-11T14:59:36.786465","created_date":"2023-09-16T00:00:00"}
