{"id":"https://openalex.org/W2405954614","doi":"https://doi.org/10.21437/eurospeech.1999-306","title":"Detection of speaker changes in an audio document","display_name":"Detection of speaker changes in an audio document","publication_year":1999,"publication_date":"1999-09-05","ids":{"openalex":"https://openalex.org/W2405954614","doi":"https://doi.org/10.21437/eurospeech.1999-306","mag":"2405954614"},"language":"en","primary_location":{"id":"doi:10.21437/eurospeech.1999-306","is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.1999-306","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"6th European Conference on Speech Communication and Technology","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010939305","display_name":"Perrine Delacourt","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Perrine Delacourt","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089616387","display_name":"David Kryze","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"David Kryze","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5108525230","display_name":"C. Wellekens","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Christian J. Wellekens","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.3410596,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1195","last_page":"1198"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9905999898910522,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8237299919128418},{"id":"https://openalex.org/keywords/decision-tree","display_name":"Decision tree","score":0.6878169775009155},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6667388081550598},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.516918420791626},{"id":"https://openalex.org/keywords/acoustic-model","display_name":"Acoustic model","score":0.49125999212265015},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.4667304754257202},{"id":"https://openalex.org/keywords/tree-structure","display_name":"Tree structure","score":0.4382164776325226},{"id":"https://openalex.org/keywords/incremental-decision-tree","display_name":"Incremental decision tree","score":0.425252765417099},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.4222663938999176},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.4221011996269226},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4031454920768738},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39110180735588074},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.37855982780456543},{"id":"https://openalex.org/keywords/decision-tree-learning","display_name":"Decision tree learning","score":0.36846208572387695},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3492441773414612},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.34102657437324524},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2735971212387085},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.1937844455242157},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.11900591850280762},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09333354234695435}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8237299919128418},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.6878169775009155},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6667388081550598},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.516918420791626},{"id":"https://openalex.org/C155635449","wikidata":"https://www.wikidata.org/wiki/Q4674699","display_name":"Acoustic model","level":3,"score":0.49125999212265015},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.4667304754257202},{"id":"https://openalex.org/C163797641","wikidata":"https://www.wikidata.org/wiki/Q2067937","display_name":"Tree structure","level":3,"score":0.4382164776325226},{"id":"https://openalex.org/C10229987","wikidata":"https://www.wikidata.org/wiki/Q17083028","display_name":"Incremental decision tree","level":4,"score":0.425252765417099},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.4222663938999176},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.4221011996269226},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4031454920768738},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39110180735588074},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37855982780456543},{"id":"https://openalex.org/C5481197","wikidata":"https://www.wikidata.org/wiki/Q16766476","display_name":"Decision tree learning","level":3,"score":0.36846208572387695},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3492441773414612},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34102657437324524},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2735971212387085},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.1937844455242157},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.11900591850280762},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09333354234695435},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C197855036","wikidata":"https://www.wikidata.org/wiki/Q380172","display_name":"Binary tree","level":2,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/eurospeech.1999-306","is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.1999-306","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"6th European Conference on Speech Communication and Technology","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.800000011920929}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W130623727","https://openalex.org/W137969146","https://openalex.org/W182969254","https://openalex.org/W198801378","https://openalex.org/W1555410120","https://openalex.org/W1594031697","https://openalex.org/W1926823873","https://openalex.org/W2108341231","https://openalex.org/W2158069733","https://openalex.org/W2276283915","https://openalex.org/W2603454388","https://openalex.org/W3085162807"],"related_works":["https://openalex.org/W2030894524","https://openalex.org/W1982169401","https://openalex.org/W1648970942","https://openalex.org/W2811372817","https://openalex.org/W2120748120","https://openalex.org/W2545418239","https://openalex.org/W2591672004","https://openalex.org/W4243803609","https://openalex.org/W4319437832","https://openalex.org/W2350430350"],"abstract_inverted_index":{"Phonetic":[0],"decision-tree":[1,105],"based":[2,106],"acoustic":[3,37],"modeling":[4],"has":[5],"been":[6],"widely":[7],"used":[8],"in":[9,20],"speech":[10],"recognition":[11],"systems.":[12],"However,":[13],"the":[14,21,33,36,64,77,83,86,103,110,129],"assumption":[15],"that":[16,116],"all":[17],"states":[18],"clustered":[19],"same":[22],"leaf":[23],"node":[24],"share":[25],"both":[26],"their":[27],"Gaussians":[28],"and":[29,62,67,88],"mixture":[30],"weights":[31],"restricts":[32],"improvement":[34],"of":[35,59,79,85],"models.":[38],"In":[39],"this":[40,52],"paper,":[41],"we":[42,54,93],"propose":[43],"a":[44,48,122],"new":[45],"structure":[46,53],"called":[47],"two-level":[49],"decisiontree.":[50],"With":[51],"can":[55,94,119],"make":[56],"better":[57,96],"use":[58],"training":[60],"data":[61],"improve":[63],"model":[65],"accuracy":[66],"robustness.":[68],"Two-level":[69],"decision":[70],"trees":[71],"provide":[72],"more":[73],"flexibility":[74],"to":[75],"control":[76],"number":[78],"parameters.":[80],"By":[81],"tuning":[82],"balance":[84],"first":[87],"second":[89],"level":[90],"tree":[91],"nodes,":[92],"get":[95],"performance":[97],"with":[98],"even":[99],"fewer":[100],"parameters":[101],"than":[102],"traditional":[104],"approach.":[107,131],"Experiments":[108],"on":[109],"Wall":[111],"Street":[112],"Journal":[113],"tasks":[114],"show":[115],"our":[117],"approach":[118],"achieve":[120],"about":[121],"10%":[123],"word":[124],"error":[125],"rate":[126],"reduction":[127],"over":[128],"conventional":[130]},"counts_by_year":[{"year":2018,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2016-06-24T00:00:00"}
