{"id":"https://openalex.org/W4409872469","doi":"https://doi.org/10.1162/tacl_a_00745","title":"The Thai Universal Dependency Treebank","display_name":"The Thai Universal Dependency Treebank","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4409872469","doi":"https://doi.org/10.1162/tacl_a_00745"},"language":"en","primary_location":{"id":"doi:10.1162/tacl_a_00745","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00745","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00745/2514583/tacl_a_00745.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00745/2514583/tacl_a_00745.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093321372","display_name":"Panyut Sriwirote","orcid":"https://orcid.org/0009-0007-0296-4275"},"institutions":[{"id":"https://openalex.org/I158708052","display_name":"Chulalongkorn University","ror":"https://ror.org/028wp3y58","country_code":"TH","type":"education","lineage":["https://openalex.org/I158708052"]}],"countries":["TH"],"is_corresponding":true,"raw_author_name":"Panyut Sriwirote","raw_affiliation_strings":["Department of Linguistics, Chulalongkorn University, Thailand. panyutsriwirote@gmail.com"],"affiliations":[{"raw_affiliation_string":"Department of Linguistics, Chulalongkorn University, Thailand. panyutsriwirote@gmail.com","institution_ids":["https://openalex.org/I158708052"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038370332","display_name":"Wei Qi Leong","orcid":"https://orcid.org/0009-0002-0645-1112"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei Qi Leong","raw_affiliation_strings":["AI Singapore, Singapore. weiqi@aisingapore.org"],"affiliations":[{"raw_affiliation_string":"AI Singapore, Singapore. weiqi@aisingapore.org","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001689161","display_name":"Charin Polpanumas","orcid":"https://orcid.org/0000-0001-7822-4600"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Charin Polpanumas","raw_affiliation_strings":["Amazon, Japan. cebril@gmail.com"],"affiliations":[{"raw_affiliation_string":"Amazon, Japan. cebril@gmail.com","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048271631","display_name":"Santhawat Thanyawong","orcid":null},"institutions":[{"id":"https://openalex.org/I131868736","display_name":"Prince of Songkla University","ror":"https://ror.org/0575ycz84","country_code":"TH","type":"education","lineage":["https://openalex.org/I131868736"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Santhawat Thanyawong","raw_affiliation_strings":["Faculty of Humanities and Social Sciences, Prince of Songkla University, Thailand. santhawat.t@psu.ac.th"],"affiliations":[{"raw_affiliation_string":"Faculty of Humanities and Social Sciences, Prince of Songkla University, Thailand. santhawat.t@psu.ac.th","institution_ids":["https://openalex.org/I131868736"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086528347","display_name":"William Chandra Tjhi","orcid":"https://orcid.org/0009-0009-9861-3545"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"William Chandra Tjhi","raw_affiliation_strings":["AI Singapore, Singapore. wtjhi@aisingapore.org"],"affiliations":[{"raw_affiliation_string":"AI Singapore, Singapore. wtjhi@aisingapore.org","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062206645","display_name":"Wirote Aroonmanakun","orcid":null},"institutions":[{"id":"https://openalex.org/I158708052","display_name":"Chulalongkorn University","ror":"https://ror.org/028wp3y58","country_code":"TH","type":"education","lineage":["https://openalex.org/I158708052"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Wirote Aroonmanakun","raw_affiliation_strings":["Department of Linguistics, Chulalongkorn University, Thailand. awirote@chula.ac.th"],"affiliations":[{"raw_affiliation_string":"Department of Linguistics, Chulalongkorn University, Thailand. awirote@chula.ac.th","institution_ids":["https://openalex.org/I158708052"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008312239","display_name":"Attapol Rutherford","orcid":"https://orcid.org/0000-0003-2270-6082"},"institutions":[{"id":"https://openalex.org/I158708052","display_name":"Chulalongkorn University","ror":"https://ror.org/028wp3y58","country_code":"TH","type":"education","lineage":["https://openalex.org/I158708052"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Attapol T. Rutherford","raw_affiliation_strings":["Department of Linguistics, Chulalongkorn University, Thailand attapol. attapol.t"],"affiliations":[{"raw_affiliation_string":"Department of Linguistics, Chulalongkorn University, Thailand attapol. attapol.t","institution_ids":["https://openalex.org/I158708052"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5093321372"],"corresponding_institution_ids":["https://openalex.org/I158708052"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.04084838,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"13","issue":null,"first_page":"376","last_page":"391"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9765999913215637,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/treebank","display_name":"Treebank","score":0.9789458513259888},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8270986080169678},{"id":"https://openalex.org/keywords/dependency","display_name":"Dependency (UML)","score":0.8041701912879944},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6092185974121094},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5080127716064453},{"id":"https://openalex.org/keywords/dependency-grammar","display_name":"Dependency grammar","score":0.41103675961494446},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.32332128286361694}],"concepts":[{"id":"https://openalex.org/C206134035","wikidata":"https://www.wikidata.org/wiki/Q811525","display_name":"Treebank","level":3,"score":0.9789458513259888},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8270986080169678},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.8041701912879944},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6092185974121094},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5080127716064453},{"id":"https://openalex.org/C164883195","wikidata":"https://www.wikidata.org/wiki/Q674834","display_name":"Dependency grammar","level":3,"score":0.41103675961494446},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.32332128286361694}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1162/tacl_a_00745","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00745","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00745/2514583/tacl_a_00745.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1162/tacl_a_00745","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00745","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00745/2514583/tacl_a_00745.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3034753964","display_name":null,"funder_award_id":"grant","funder_id":"https://openalex.org/F4320320671","funder_display_name":"National Research Foundation"}],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320320709","display_name":"National Research Foundation Singapore","ror":"https://ror.org/03cpyc314"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4409872469.pdf","grobid_xml":"https://content.openalex.org/works/W4409872469.grobid-xml"},"referenced_works_count":45,"referenced_works":["https://openalex.org/W1607035479","https://openalex.org/W2045384855","https://openalex.org/W2053154970","https://openalex.org/W2094624848","https://openalex.org/W2105847779","https://openalex.org/W2340253197","https://openalex.org/W2552110825","https://openalex.org/W2618735189","https://openalex.org/W2740840489","https://openalex.org/W2752392399","https://openalex.org/W2899024931","https://openalex.org/W2915977242","https://openalex.org/W2917956622","https://openalex.org/W2953359159","https://openalex.org/W2963021447","https://openalex.org/W2963106122","https://openalex.org/W2963341956","https://openalex.org/W2963370123","https://openalex.org/W2965373594","https://openalex.org/W2969873034","https://openalex.org/W2970529259","https://openalex.org/W2986154550","https://openalex.org/W2996052604","https://openalex.org/W3011573503","https://openalex.org/W3013703241","https://openalex.org/W3035058125","https://openalex.org/W3101226838","https://openalex.org/W3103187652","https://openalex.org/W3105033018","https://openalex.org/W3133551016","https://openalex.org/W3156159991","https://openalex.org/W3174505712","https://openalex.org/W3207806388","https://openalex.org/W4229839837","https://openalex.org/W4287370843","https://openalex.org/W4297801177","https://openalex.org/W4319334880","https://openalex.org/W4381162709","https://openalex.org/W4388927863","https://openalex.org/W6629386296","https://openalex.org/W6675420493","https://openalex.org/W6686234212","https://openalex.org/W6703978569","https://openalex.org/W6949947755","https://openalex.org/W7024746193"],"related_works":["https://openalex.org/W4225089174","https://openalex.org/W2251234095","https://openalex.org/W2251015434","https://openalex.org/W4212832296","https://openalex.org/W2577569078","https://openalex.org/W2576044174","https://openalex.org/W2180950424","https://openalex.org/W1987996389","https://openalex.org/W2940288729","https://openalex.org/W3135607784"],"abstract_inverted_index":{"Abstract":[0],"Automatic":[1],"dependency":[2,18,22,72,97,124],"parsing":[3,73],"of":[4,15,27,31,57,102,115],"Thai":[5,17,47,54,96,123],"sentences":[6],"has":[7],"been":[8],"underexplored,":[9],"as":[10],"evidenced":[11],"by":[12,44],"the":[13,25,46,63,91,103],"lack":[14,26,114],"large":[16],"treebanks":[19],"with":[20],"complete":[21],"structures":[23],"and":[24,81,87,113],"a":[28,52],"published":[29],"evaluation":[30],"state-of-the-art":[32,85],"models,":[33],"especially":[34],"transformer-based":[35],"parsers.":[36],"In":[37],"this":[38],"work,":[39],"we":[40],"addressed":[41],"these":[42],"gaps":[43],"introducing":[45],"Universal":[48,64],"Dependency":[49],"Treebank":[50],"(TUD),":[51],"new":[53],"treebank":[55],"consisting":[56],"3,627":[58],"trees":[59],"annotated":[60],"according":[61],"to":[62],"Dependencies":[65],"(UD)":[66],"framework.":[67],"We":[68],"then":[69],"benchmarked":[70],"92":[71],"models":[74,104],"that":[75,107],"incorporate":[76],"pretrained":[77],"transformers":[78],"on":[79,90],"Thai-PUD":[80],"our":[82],"TUD,":[83],"achieving":[84],"results":[86],"shedding":[88],"light":[89],"optimal":[92],"model":[93],"components":[94],"for":[95,122],"parsing.":[98,125],"Our":[99],"error":[100],"analysis":[101],"also":[105],"reveals":[106],"polyfunctional":[108],"words,":[109],"serial":[110],"verb":[111],"construction,":[112],"rich":[116],"morphosyntactic":[117],"features":[118],"present":[119],"main":[120],"challenges":[121]},"counts_by_year":[],"updated_date":"2026-03-14T08:43:22.919905","created_date":"2025-10-10T00:00:00"}
