{"id":"https://openalex.org/W2592584157","doi":"https://doi.org/10.1186/s13636-017-0102-8","title":"Statistical analysis of orthographic and phonemic language corpus for word-based and phoneme-based Polish language modelling","display_name":"Statistical analysis of orthographic and phonemic language corpus for word-based and phoneme-based Polish language modelling","publication_year":2017,"publication_date":"2017-02-28","ids":{"openalex":"https://openalex.org/W2592584157","doi":"https://doi.org/10.1186/s13636-017-0102-8","mag":"2592584157"},"language":"en","primary_location":{"id":"doi:10.1186/s13636-017-0102-8","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-017-0102-8","pdf_url":"https://asmp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13636-017-0102-8","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://asmp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13636-017-0102-8","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073804552","display_name":"Piotr K\u0142osowski","orcid":"https://orcid.org/0000-0002-1275-4147"},"institutions":[{"id":"https://openalex.org/I119004910","display_name":"Silesian University of Technology","ror":"https://ror.org/02dyjk442","country_code":"PL","type":"education","lineage":["https://openalex.org/I119004910"]}],"countries":["PL"],"is_corresponding":true,"raw_author_name":"Piotr K\u0142osowski","raw_affiliation_strings":["Department of Electronics, Faculty of Automatic Control, Electronics and Computer Science, Silesian University of Technology, Akademicka 16, Gliwice, 44-100, Poland"],"affiliations":[{"raw_affiliation_string":"Department of Electronics, Faculty of Automatic Control, Electronics and Computer Science, Silesian University of Technology, Akademicka 16, Gliwice, 44-100, Poland","institution_ids":["https://openalex.org/I119004910"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5073804552"],"corresponding_institution_ids":["https://openalex.org/I119004910"],"apc_list":{"value":1115,"currency":"GBP","value_usd":1367},"apc_paid":{"value":1115,"currency":"GBP","value_usd":1367},"fwci":5.9527,"has_fulltext":true,"cited_by_count":10,"citation_normalized_percentile":{"value":0.96067756,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"2017","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12658","display_name":"Language and Culture","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/3310","display_name":"Linguistics and Language"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12658","display_name":"Language and Culture","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/3310","display_name":"Linguistics and Language"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13707","display_name":"Literature, Language, and Rhetoric Studies","score":0.9871000051498413,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9650999903678894,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7627565860748291},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6197428107261658},{"id":"https://openalex.org/keywords/orthographic-projection","display_name":"Orthographic projection","score":0.5676751732826233},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5195153951644897},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4986398220062256},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.46807584166526794},{"id":"https://openalex.org/keywords/speech-corpus","display_name":"Speech corpus","score":0.4593193531036377},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.4482637643814087},{"id":"https://openalex.org/keywords/corpus-linguistics","display_name":"Corpus linguistics","score":0.42960697412490845},{"id":"https://openalex.org/keywords/cache-language-model","display_name":"Cache language model","score":0.42772629857063293},{"id":"https://openalex.org/keywords/statistical-analysis","display_name":"Statistical analysis","score":0.4103170931339264},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3525206446647644},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.2731563448905945},{"id":"https://openalex.org/keywords/universal-networking-language","display_name":"Universal Networking Language","score":0.2552992105484009},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.14436018466949463},{"id":"https://openalex.org/keywords/comprehension-approach","display_name":"Comprehension approach","score":0.12682726979255676},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09473782777786255}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7627565860748291},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6197428107261658},{"id":"https://openalex.org/C175694140","wikidata":"https://www.wikidata.org/wiki/Q980329","display_name":"Orthographic projection","level":2,"score":0.5676751732826233},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5195153951644897},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4986398220062256},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.46807584166526794},{"id":"https://openalex.org/C91863865","wikidata":"https://www.wikidata.org/wiki/Q4349497","display_name":"Speech corpus","level":3,"score":0.4593193531036377},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.4482637643814087},{"id":"https://openalex.org/C532629269","wikidata":"https://www.wikidata.org/wiki/Q865083","display_name":"Corpus linguistics","level":2,"score":0.42960697412490845},{"id":"https://openalex.org/C39608478","wikidata":"https://www.wikidata.org/wiki/Q5015979","display_name":"Cache language model","level":5,"score":0.42772629857063293},{"id":"https://openalex.org/C2986587452","wikidata":"https://www.wikidata.org/wiki/Q938438","display_name":"Statistical analysis","level":2,"score":0.4103170931339264},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3525206446647644},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.2731563448905945},{"id":"https://openalex.org/C83479923","wikidata":"https://www.wikidata.org/wiki/Q2063748","display_name":"Universal Networking Language","level":4,"score":0.2552992105484009},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.14436018466949463},{"id":"https://openalex.org/C129353971","wikidata":"https://www.wikidata.org/wiki/Q5156949","display_name":"Comprehension approach","level":3,"score":0.12682726979255676},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09473782777786255},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1186/s13636-017-0102-8","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-017-0102-8","pdf_url":"https://asmp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13636-017-0102-8","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1186/s13636-017-0102-8","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-017-0102-8","pdf_url":"https://asmp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13636-017-0102-8","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7300000190734863}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2592584157.pdf","grobid_xml":"https://content.openalex.org/works/W2592584157.grobid-xml"},"referenced_works_count":53,"referenced_works":["https://openalex.org/W15523229","https://openalex.org/W15779796","https://openalex.org/W44059908","https://openalex.org/W169008908","https://openalex.org/W398115157","https://openalex.org/W404695663","https://openalex.org/W1003348853","https://openalex.org/W1024780720","https://openalex.org/W1482958624","https://openalex.org/W1507719567","https://openalex.org/W1508165687","https://openalex.org/W1513168562","https://openalex.org/W1518948183","https://openalex.org/W1527014113","https://openalex.org/W1562736752","https://openalex.org/W1595187495","https://openalex.org/W1606884126","https://openalex.org/W1663984431","https://openalex.org/W1868795753","https://openalex.org/W1898164463","https://openalex.org/W1913261780","https://openalex.org/W1959176866","https://openalex.org/W1967461618","https://openalex.org/W1970689298","https://openalex.org/W1977323050","https://openalex.org/W1997658820","https://openalex.org/W2010436475","https://openalex.org/W2025221376","https://openalex.org/W2027276499","https://openalex.org/W2048176942","https://openalex.org/W2079656678","https://openalex.org/W2080213370","https://openalex.org/W2099111195","https://openalex.org/W2105638720","https://openalex.org/W2134182172","https://openalex.org/W2135153490","https://openalex.org/W2135869163","https://openalex.org/W2139799434","https://openalex.org/W2163829421","https://openalex.org/W2166221226","https://openalex.org/W2166850712","https://openalex.org/W2286739582","https://openalex.org/W2397798422","https://openalex.org/W2494935878","https://openalex.org/W2513592917","https://openalex.org/W2560793587","https://openalex.org/W2602331152","https://openalex.org/W3144203334","https://openalex.org/W4250450525","https://openalex.org/W4254972968","https://openalex.org/W4256617900","https://openalex.org/W4388400684","https://openalex.org/W6627465322"],"related_works":["https://openalex.org/W4255155614","https://openalex.org/W2394860946","https://openalex.org/W761725120","https://openalex.org/W2009170886","https://openalex.org/W2071315630","https://openalex.org/W2897427480","https://openalex.org/W2787311093","https://openalex.org/W1508853749","https://openalex.org/W1745277","https://openalex.org/W2147766635"],"abstract_inverted_index":{"This":[0],"article":[1],"presents":[2],"the":[3,13,32,39,48,56,78],"original":[4],"results":[5],"of":[6,31,42,58,64,74,77,96,121],"Polish":[7,23,43,52,65],"language":[8,17,20,35,66,70,82,90,107,113],"statistical":[9,62,98,103],"analysis,":[10,99],"based":[11,67],"on":[12,68],"orthographic":[14,34,79],"and":[15,80,105],"phonemic":[16,59,69,81],"corpus.":[18],"Phonemic":[19],"corpus":[21,46],"for":[22,109,125],"was":[24],"developed":[25],"by":[26],"using":[27],"automatic":[28,122],"grapheme-to-phoneme":[29],"conversion":[30],"source":[33],"corpus,":[36,71],"obtained":[37,92],"from":[38],"National":[40],"Corpus":[41],"(NCP).":[44],"The":[45],"contains":[47],"most":[49],"frequently":[50],"used":[51],"words,":[53],"written":[54],"with":[55],"use":[57],"notation.":[60],"Performed":[61],"analysis":[63],"includes":[72],"frequency":[73],"occurrence":[75],"calculation":[76],"components,":[83],"as":[84,86,93],"well":[85],"their":[87],"sequence.":[88],"Statistical":[89],"data,":[91],"a":[94],"result":[95],"performed":[97],"enable":[100],"to":[101,118],"develop":[102],"word-based":[104],"phoneme-based":[106],"models":[108,114],"Polish.":[110,126],"Applying":[111],"these":[112],"can":[115],"effectively":[116],"contribute":[117],"efficiency":[119],"improvement":[120],"speech":[123],"recognition":[124]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
