{"id":"https://openalex.org/W3174136362","doi":"https://doi.org/10.1109/taslp.2021.3093817","title":"Hybrid Speech and Text Analysis Methods for Speaker Change Detection","display_name":"Hybrid Speech and Text Analysis Methods for Speaker Change Detection","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3174136362","doi":"https://doi.org/10.1109/taslp.2021.3093817","mag":"3174136362"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2021.3093817","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3093817","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086774507","display_name":"Or Haim Anidjar","orcid":"https://orcid.org/0000-0002-7673-6511"},"institutions":[{"id":"https://openalex.org/I52170813","display_name":"Ariel University","ror":"https://ror.org/03nz8qe97","country_code":"IL","type":"education","lineage":["https://openalex.org/I52170813"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Or Haim Anidjar","raw_affiliation_strings":["Data Science, Artificial Intelligence Research Center, Ariel University, Ramat HaGolan, Israel","Department of Computer Science, Ariel University, Ariel, IL, Israel"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Data Science, Artificial Intelligence Research Center, Ariel University, Ramat HaGolan, Israel","institution_ids":["https://openalex.org/I52170813"]},{"raw_affiliation_string":"Department of Computer Science, Ariel University, Ariel, IL, Israel","institution_ids":["https://openalex.org/I52170813"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002668439","display_name":"Itshak Lapidot","orcid":"https://orcid.org/0000-0003-1066-3441"},"institutions":[{"id":"https://openalex.org/I119096390","display_name":"Afeka College of Engineering","ror":"https://ror.org/05dhprc49","country_code":"IL","type":"education","lineage":["https://openalex.org/I119096390"]},{"id":"https://openalex.org/I198415970","display_name":"Universit\u00e9 d'Avignon et des Pays de Vaucluse","ror":"https://ror.org/00mfpxb84","country_code":"FR","type":"education","lineage":["https://openalex.org/I198415970"]}],"countries":["FR","IL"],"is_corresponding":false,"raw_author_name":"Itshak Lapidot","raw_affiliation_strings":["Afeka Tel-Aviv Academic College of Engineering, ACLP, Tel-Aviv, IL, Israel","Avignon University, Pasteur, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Afeka Tel-Aviv Academic College of Engineering, ACLP, Tel-Aviv, IL, Israel","institution_ids":["https://openalex.org/I119096390"]},{"raw_affiliation_string":"Avignon University, Pasteur, France","institution_ids":["https://openalex.org/I198415970"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023899502","display_name":"Chen Hajaj","orcid":"https://orcid.org/0000-0001-9940-5654"},"institutions":[{"id":"https://openalex.org/I52170813","display_name":"Ariel University","ror":"https://ror.org/03nz8qe97","country_code":"IL","type":"education","lineage":["https://openalex.org/I52170813"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Chen Hajaj","raw_affiliation_strings":["Ariel Cyber Innovation Center, Ariel, IL, Israel","Data Science Artificial Intelligence Research Center, Ariel University, Ramat HaGolan, Israel","Department of Industrial Engineering, Management, Ariel University, Ariel, IL, Israel"],"raw_orcid":"https://orcid.org/0000-0001-9940-5654","affiliations":[{"raw_affiliation_string":"Ariel Cyber Innovation Center, Ariel, IL, Israel","institution_ids":["https://openalex.org/I52170813"]},{"raw_affiliation_string":"Data Science Artificial Intelligence Research Center, Ariel University, Ramat HaGolan, Israel","institution_ids":["https://openalex.org/I52170813"]},{"raw_affiliation_string":"Department of Industrial Engineering, Management, Ariel University, Ariel, IL, Israel","institution_ids":["https://openalex.org/I52170813"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081239516","display_name":"Amit Dvir","orcid":"https://orcid.org/0000-0002-3670-0784"},"institutions":[{"id":"https://openalex.org/I52170813","display_name":"Ariel University","ror":"https://ror.org/03nz8qe97","country_code":"IL","type":"education","lineage":["https://openalex.org/I52170813"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Amit Dvir","raw_affiliation_strings":["Ariel Cyber Innovation Center, Ariel, IL, Israel","Department of Computer Science, Ariel University, Ariel, IL, Israel"],"raw_orcid":"https://orcid.org/0000-0002-3670-0784","affiliations":[{"raw_affiliation_string":"Ariel Cyber Innovation Center, Ariel, IL, Israel","institution_ids":["https://openalex.org/I52170813"]},{"raw_affiliation_string":"Department of Computer Science, Ariel University, Ariel, IL, Israel","institution_ids":["https://openalex.org/I52170813"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017244199","display_name":"Issachar Gilad","orcid":null},"institutions":[{"id":"https://openalex.org/I52170813","display_name":"Ariel University","ror":"https://ror.org/03nz8qe97","country_code":"IL","type":"education","lineage":["https://openalex.org/I52170813"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Issachar Gilad","raw_affiliation_strings":["Department of Industrial Engineering, Management, Ariel University, Ariel, IL, Israel"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Industrial Engineering, Management, Ariel University, Ariel, IL, Israel","institution_ids":["https://openalex.org/I52170813"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.1195,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.82167007,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"29","issue":null,"first_page":"2324","last_page":"2338"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.8412555456161499},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8081878423690796},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6770956516265869},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6407827138900757},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5840116739273071},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5425813794136047},{"id":"https://openalex.org/keywords/market-segmentation","display_name":"Market segmentation","score":0.4773564338684082},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46951526403427124},{"id":"https://openalex.org/keywords/transcription","display_name":"Transcription (linguistics)","score":0.4615258276462555},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4434252977371216},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.39636749029159546},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3774378299713135},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.06736505031585693}],"concepts":[{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.8412555456161499},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8081878423690796},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6770956516265869},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6407827138900757},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5840116739273071},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5425813794136047},{"id":"https://openalex.org/C125308379","wikidata":"https://www.wikidata.org/wiki/Q363057","display_name":"Market segmentation","level":2,"score":0.4773564338684082},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46951526403427124},{"id":"https://openalex.org/C179926584","wikidata":"https://www.wikidata.org/wiki/Q207714","display_name":"Transcription (linguistics)","level":2,"score":0.4615258276462555},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4434252977371216},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.39636749029159546},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3774378299713135},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.06736505031585693},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2021.3093817","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3093817","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5799999833106995}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":92,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1966142845","https://openalex.org/W2000091716","https://openalex.org/W2010114458","https://openalex.org/W2011797273","https://openalex.org/W2020150184","https://openalex.org/W2042606741","https://openalex.org/W2075662881","https://openalex.org/W2095734449","https://openalex.org/W2106657366","https://openalex.org/W2113386290","https://openalex.org/W2114925438","https://openalex.org/W2114970513","https://openalex.org/W2115599677","https://openalex.org/W2117076645","https://openalex.org/W2130942839","https://openalex.org/W2159591770","https://openalex.org/W2174668315","https://openalex.org/W2289985966","https://openalex.org/W2426479676","https://openalex.org/W2473329891","https://openalex.org/W2605266158","https://openalex.org/W2613904329","https://openalex.org/W2673722796","https://openalex.org/W2726515241","https://openalex.org/W2739041555","https://openalex.org/W2743167696","https://openalex.org/W2786458517","https://openalex.org/W2786672272","https://openalex.org/W2791062765","https://openalex.org/W2803187616","https://openalex.org/W2804758275","https://openalex.org/W2806264589","https://openalex.org/W2889418727","https://openalex.org/W2890825077","https://openalex.org/W2890964092","https://openalex.org/W2896538040","https://openalex.org/W2900130877","https://openalex.org/W2902665437","https://openalex.org/W2902864383","https://openalex.org/W2903877528","https://openalex.org/W2909693411","https://openalex.org/W2913959203","https://openalex.org/W2936539332","https://openalex.org/W2939634425","https://openalex.org/W2962788625","https://openalex.org/W2963227667","https://openalex.org/W2963341956","https://openalex.org/W2963470929","https://openalex.org/W2963745998","https://openalex.org/W2964121744","https://openalex.org/W2964247090","https://openalex.org/W2964265128","https://openalex.org/W2967193527","https://openalex.org/W2970568180","https://openalex.org/W2972073579","https://openalex.org/W2972449503","https://openalex.org/W2973127116","https://openalex.org/W2978352747","https://openalex.org/W3008392149","https://openalex.org/W3010196324","https://openalex.org/W3012958665","https://openalex.org/W3015308613","https://openalex.org/W3015621653","https://openalex.org/W3015783745","https://openalex.org/W3015810999","https://openalex.org/W3015922793","https://openalex.org/W3016112863","https://openalex.org/W3019220537","https://openalex.org/W3025831232","https://openalex.org/W3032959444","https://openalex.org/W3091905774","https://openalex.org/W3095212884","https://openalex.org/W3100703861","https://openalex.org/W3110732916","https://openalex.org/W3210532662","https://openalex.org/W4235151464","https://openalex.org/W4239025696","https://openalex.org/W4294589828","https://openalex.org/W6631190155","https://openalex.org/W6674565674","https://openalex.org/W6677459581","https://openalex.org/W6679436768","https://openalex.org/W6696885005","https://openalex.org/W6737778391","https://openalex.org/W6748447238","https://openalex.org/W6751420435","https://openalex.org/W6768041154","https://openalex.org/W6770434673","https://openalex.org/W6774558098","https://openalex.org/W6779341582","https://openalex.org/W6783596713"],"related_works":["https://openalex.org/W2592395359","https://openalex.org/W2045342254","https://openalex.org/W2535231171","https://openalex.org/W2206035908","https://openalex.org/W2142182663","https://openalex.org/W1501331687","https://openalex.org/W4255512592","https://openalex.org/W2501551404","https://openalex.org/W1493012537","https://openalex.org/W2326647871"],"abstract_inverted_index":{"Speaker":[0,21],"Change":[1],"Detection":[2],"(SCD)":[3],"is":[4,100,146,176],"the":[5,39,43,46,55,61,68,73,84,96,109,121,128,133,137,140,165,170],"task":[6,41],"of":[7,42,63,130],"segmenting":[8,48],"an":[9,125],"input":[10],"audio-recording":[11],"according":[12],"to":[13,164],"speaker":[14,65],"interchanges.":[15],"Nowadays,":[16],"many":[17],"applications,":[18],"such":[19],"as":[20,58,60,169],"Diarization":[22],"(SD)":[23],"or":[24],"automatic":[25],"vocal":[26],"transcription,":[27],"depend":[28],"on":[29,38,139,178],"this":[30,34],"segmentation":[31],"task.":[32],"In":[33],"paper,":[35],"we":[36,90,119,154],"focus":[37],"essential":[40],"SD":[44],"problem,":[45,57],"audio":[47],"process,":[49],"and":[50,71,83,105,108,136,174],"suggest":[51],"a":[52,78,92],"solution":[53,74],"for":[54,67,95],"SCD":[56,97,151],"well":[59],"assignment":[62],"clustered":[64],"labels":[66],"extracted":[69,115],"segments,":[70],"applying":[72],"over":[75],"two":[76,179],"datasets:":[77],"commercial":[79],"dataset":[80,135],"in":[81,127,132],"Hebrew":[82],"ICSI":[85,166],"Meeting":[86,167],"Corpus.":[87],"As":[88],"such,":[89],"propose":[91],"hybrid":[93,159],"framework":[94,160],"problem":[98],"that":[99,112],"learned":[101],"by":[102],"textual":[103],"information":[104],"speech":[106],"signals":[107],"meta-data":[110],"features":[111],"can":[113],"be":[114],"from":[116],"them.":[117],"Moreover,":[118],"demonstrate":[120],"negative":[122],"correlation":[123],"between":[124],"increase":[126],"number":[129],"speakers":[131],"training":[134,173],"influence":[138],"overall":[141],"diarization":[142],"system's":[143],"performance,":[144],"which":[145],"improved":[147],"using":[148],"our":[149,157],"efficient":[150],"component.":[152],"Finally,":[153],"show":[155],"how":[156],"proposed":[158],"remains":[161],"robust":[162],"compared":[163],"Corpus,":[168],"experimental":[171],"evaluation's":[172],"testing":[175],"based":[177],"languages.":[180]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
