{"id":"https://openalex.org/W1965276979","doi":"https://doi.org/10.1109/coginfocom.2013.6719169","title":"Language independent automatic speech segmentation into phoneme-like units on the base of acoustic distinctive features","display_name":"Language independent automatic speech segmentation into phoneme-like units on the base of acoustic distinctive features","publication_year":2013,"publication_date":"2013-12-01","ids":{"openalex":"https://openalex.org/W1965276979","doi":"https://doi.org/10.1109/coginfocom.2013.6719169","mag":"1965276979"},"language":"en","primary_location":{"id":"doi:10.1109/coginfocom.2013.6719169","is_oa":false,"landing_page_url":"https://doi.org/10.1109/coginfocom.2013.6719169","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE 4th International Conference on Cognitive Infocommunications (CogInfoCom)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091684390","display_name":"G\u00e1bor Kiss","orcid":"https://orcid.org/0000-0002-0447-9376"},"institutions":[{"id":"https://openalex.org/I29770179","display_name":"Budapest University of Technology and Economics","ror":"https://ror.org/02w42ss30","country_code":"HU","type":"education","lineage":["https://openalex.org/I29770179"]}],"countries":["HU"],"is_corresponding":true,"raw_author_name":"Gabor Kiss","raw_affiliation_strings":["Department of Telecommunication and Media Informatics, Budapest University of Technology and Economics, Budapest, Hungary","Dept. of Telecommun. & Media Inf., Budapest Univ. of Technol. & Econ., Budapest, Hungary"],"affiliations":[{"raw_affiliation_string":"Department of Telecommunication and Media Informatics, Budapest University of Technology and Economics, Budapest, Hungary","institution_ids":["https://openalex.org/I29770179"]},{"raw_affiliation_string":"Dept. of Telecommun. & Media Inf., Budapest Univ. of Technol. & Econ., Budapest, Hungary","institution_ids":["https://openalex.org/I29770179"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083596812","display_name":"D\u00e1vid Sztah\u00f3","orcid":"https://orcid.org/0000-0002-7361-4260"},"institutions":[{"id":"https://openalex.org/I29770179","display_name":"Budapest University of Technology and Economics","ror":"https://ror.org/02w42ss30","country_code":"HU","type":"education","lineage":["https://openalex.org/I29770179"]}],"countries":["HU"],"is_corresponding":false,"raw_author_name":"David Sztaho","raw_affiliation_strings":["Department of Telecommunication and Media Informatics, Budapest University of Technology and Economics, Budapest, Hungary","Dept. of Telecommun. & Media Inf., Budapest Univ. of Technol. & Econ., Budapest, Hungary"],"affiliations":[{"raw_affiliation_string":"Department of Telecommunication and Media Informatics, Budapest University of Technology and Economics, Budapest, Hungary","institution_ids":["https://openalex.org/I29770179"]},{"raw_affiliation_string":"Dept. of Telecommun. & Media Inf., Budapest Univ. of Technol. & Econ., Budapest, Hungary","institution_ids":["https://openalex.org/I29770179"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088818569","display_name":"Kl\u00e1ra Vicsi","orcid":"https://orcid.org/0000-0002-7828-6833"},"institutions":[{"id":"https://openalex.org/I29770179","display_name":"Budapest University of Technology and Economics","ror":"https://ror.org/02w42ss30","country_code":"HU","type":"education","lineage":["https://openalex.org/I29770179"]}],"countries":["HU"],"is_corresponding":false,"raw_author_name":"Klara Vicsi","raw_affiliation_strings":["Department of Telecommunication and Media Informatics, Budapest University of Technology and Economics, Budapest, Hungary","Dept. of Telecommun. & Media Inf., Budapest Univ. of Technol. & Econ., Budapest, Hungary"],"affiliations":[{"raw_affiliation_string":"Department of Telecommunication and Media Informatics, Budapest University of Technology and Economics, Budapest, Hungary","institution_ids":["https://openalex.org/I29770179"]},{"raw_affiliation_string":"Dept. of Telecommun. & Media Inf., Budapest Univ. of Technol. & Econ., Budapest, Hungary","institution_ids":["https://openalex.org/I29770179"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5091684390"],"corresponding_institution_ids":["https://openalex.org/I29770179"],"apc_list":null,"apc_paid":null,"fwci":3.3663,"has_fulltext":false,"cited_by_count":29,"citation_normalized_percentile":{"value":0.92235252,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"579","last_page":"582"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8067749738693237},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.8025287985801697},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7708593606948853},{"id":"https://openalex.org/keywords/speech-segmentation","display_name":"Speech segmentation","score":0.7456183433532715},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.702826738357544},{"id":"https://openalex.org/keywords/timit","display_name":"TIMIT","score":0.6768485307693481},{"id":"https://openalex.org/keywords/german","display_name":"German","score":0.5399136543273926},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.5284179449081421},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.483148992061615},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4755682349205017},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.46875452995300293},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.44738155603408813},{"id":"https://openalex.org/keywords/speech-corpus","display_name":"Speech corpus","score":0.43483108282089233},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.38967469334602356},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3221356272697449},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.2787707448005676},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.10349616408348083}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8067749738693237},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.8025287985801697},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7708593606948853},{"id":"https://openalex.org/C207030507","wikidata":"https://www.wikidata.org/wiki/Q2266173","display_name":"Speech segmentation","level":3,"score":0.7456183433532715},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.702826738357544},{"id":"https://openalex.org/C2778724510","wikidata":"https://www.wikidata.org/wiki/Q7670405","display_name":"TIMIT","level":3,"score":0.6768485307693481},{"id":"https://openalex.org/C154775046","wikidata":"https://www.wikidata.org/wiki/Q188","display_name":"German","level":2,"score":0.5399136543273926},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.5284179449081421},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.483148992061615},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4755682349205017},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.46875452995300293},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.44738155603408813},{"id":"https://openalex.org/C91863865","wikidata":"https://www.wikidata.org/wiki/Q4349497","display_name":"Speech corpus","level":3,"score":0.43483108282089233},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.38967469334602356},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3221356272697449},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.2787707448005676},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.10349616408348083},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/coginfocom.2013.6719169","is_oa":false,"landing_page_url":"https://doi.org/10.1109/coginfocom.2013.6719169","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE 4th International Conference on Cognitive Infocommunications (CogInfoCom)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.6299999952316284}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W1044918152","https://openalex.org/W1517164593","https://openalex.org/W1982021240","https://openalex.org/W2170896775","https://openalex.org/W2357221934","https://openalex.org/W2401426213","https://openalex.org/W2619993508","https://openalex.org/W3127686677","https://openalex.org/W4285719527","https://openalex.org/W6630934903","https://openalex.org/W6789826613"],"related_works":["https://openalex.org/W3127686677","https://openalex.org/W2413040788","https://openalex.org/W2048014685","https://openalex.org/W80423236","https://openalex.org/W2969683168","https://openalex.org/W2808291730","https://openalex.org/W2140130847","https://openalex.org/W2140385934","https://openalex.org/W4288256886","https://openalex.org/W2057635330"],"abstract_inverted_index":{"There":[0],"are":[1],"special":[2],"topics":[3,16],"in":[4,71],"cognitive":[5],"infocommunications":[6],"where":[7],"the":[8,19,35,45,63,87,113],"processing":[9],"of":[10,21,30,47,66,89],"continuous":[11,90],"speech":[12,22,40,67,91],"is":[13,32],"necessary.":[14],"These":[15],"often":[17],"require":[18],"segmentation":[20,31,88,100,114],"signal":[23],"into":[24,92],"phoneme":[25],"sized":[26],"units.":[27],"This":[28],"kind":[29],"necessary,":[33],"when":[34],"desired":[36],"behavior":[37],"depends":[38],"on":[39,62,86],"timing,":[41],"like":[42],"rhythm":[43],"or":[44,51],"place":[46],"voiced":[48],"sounds":[49],"(emotion":[50],"mood":[52],"detection,":[53],"language":[54,73,82],"learning,":[55],"acoustic":[56],"feature":[57],"visualization).":[58],"Segmentation":[59],"systems":[60],"based":[61,85],"acoustic-phonetic":[64],"knowledge":[65],"could":[68],"be":[69],"realized":[70],"a":[72,81],"independent":[74,83],"way.":[75],"In":[76],"this":[77],"paper":[78],"we":[79],"introduce":[80],"solution,":[84],"9":[93],"broad":[94],"phonetic":[95],"classes.":[96],"The":[97],"classification":[98],"and":[99,120],"was":[101,128],"prepared":[102],"using":[103],"Hidden":[104],"Markov":[105],"Models.":[106],"Three":[107],"databases":[108],"were":[109],"used":[110],"to":[111],"evaluate":[112],"systems:":[115],"Hungarian":[116],"MRBA,":[117],"German":[118],"KIEL":[119],"English":[121],"TIMIT":[122],"databases.":[123],"80%":[124],"average":[125],"recognition":[126],"result":[127],"obtained.":[129]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":7},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
