{"id":"https://openalex.org/W2305719592","doi":"https://doi.org/10.1109/kst.2016.7440478","title":"A system for popular Thai slang extraction from social media content with n-gram based tokenization","display_name":"A system for popular Thai slang extraction from social media content with n-gram based tokenization","publication_year":2016,"publication_date":"2016-02-01","ids":{"openalex":"https://openalex.org/W2305719592","doi":"https://doi.org/10.1109/kst.2016.7440478","mag":"2305719592"},"language":"en","primary_location":{"id":"doi:10.1109/kst.2016.7440478","is_oa":false,"landing_page_url":"https://doi.org/10.1109/kst.2016.7440478","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 8th International Conference on Knowledge and Smart Technology (KST)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110256683","display_name":"Rachsuda Jiamthapthaksin","orcid":null},"institutions":[{"id":"https://openalex.org/I115748381","display_name":"Assumption University","ror":"https://ror.org/03zmqc707","country_code":"TH","type":"education","lineage":["https://openalex.org/I115748381"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Rachsuda Jiamthapthaksin","raw_affiliation_strings":["Department of Computer Science, Vincent Mary School of Science and Technology Assumption University, Bangkok, Thailand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Vincent Mary School of Science and Technology Assumption University, Bangkok, Thailand","institution_ids":["https://openalex.org/I115748381"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073614387","display_name":"Pisal Setthawong","orcid":"https://orcid.org/0000-0003-0197-8409"},"institutions":[{"id":"https://openalex.org/I115748381","display_name":"Assumption University","ror":"https://ror.org/03zmqc707","country_code":"TH","type":"education","lineage":["https://openalex.org/I115748381"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Pisal Setthawong","raw_affiliation_strings":["Department of Business Information Systems, Martin de Tours School of Management and Economics Assumption University, Bangkok, Thailand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Business Information Systems, Martin de Tours School of Management and Economics Assumption University, Bangkok, Thailand","institution_ids":["https://openalex.org/I115748381"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045557004","display_name":"Nitipan Ratanasawetwad","orcid":null},"institutions":[{"id":"https://openalex.org/I115748381","display_name":"Assumption University","ror":"https://ror.org/03zmqc707","country_code":"TH","type":"education","lineage":["https://openalex.org/I115748381"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Nitipan Ratanasawetwad","raw_affiliation_strings":["Department of Marketing, Martin de Tours School of Management and Economics Assumption University, Bangkok, Thailand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Marketing, Martin de Tours School of Management and Economics Assumption University, Bangkok, Thailand","institution_ids":["https://openalex.org/I115748381"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I115748381"],"apc_list":null,"apc_paid":null,"fwci":0.8832,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.83413653,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"11","issue":null,"first_page":"130","last_page":"135"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9706000089645386,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/slang","display_name":"Slang","score":0.9622630476951599},{"id":"https://openalex.org/keywords/lexical-analysis","display_name":"Lexical analysis","score":0.7686195373535156},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.6989021301269531},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6504215002059937},{"id":"https://openalex.org/keywords/n-gram","display_name":"n-gram","score":0.5987977385520935},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42413920164108276},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3769937753677368},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.36305832862854004},{"id":"https://openalex.org/keywords/internet-privacy","display_name":"Internet privacy","score":0.3312460780143738},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3295596241950989},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.16038119792938232},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.12198913097381592}],"concepts":[{"id":"https://openalex.org/C2779901982","wikidata":"https://www.wikidata.org/wiki/Q8102","display_name":"Slang","level":2,"score":0.9622630476951599},{"id":"https://openalex.org/C176982825","wikidata":"https://www.wikidata.org/wiki/Q835922","display_name":"Lexical analysis","level":2,"score":0.7686195373535156},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.6989021301269531},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6504215002059937},{"id":"https://openalex.org/C117884012","wikidata":"https://www.wikidata.org/wiki/Q94489","display_name":"n-gram","level":3,"score":0.5987977385520935},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42413920164108276},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3769937753677368},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.36305832862854004},{"id":"https://openalex.org/C108827166","wikidata":"https://www.wikidata.org/wiki/Q175975","display_name":"Internet privacy","level":1,"score":0.3312460780143738},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3295596241950989},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.16038119792938232},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.12198913097381592},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/kst.2016.7440478","is_oa":false,"landing_page_url":"https://doi.org/10.1109/kst.2016.7440478","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 8th International Conference on Knowledge and Smart Technology (KST)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7900000214576721,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W31502041","https://openalex.org/W36611794","https://openalex.org/W1574972022","https://openalex.org/W1975428268","https://openalex.org/W2005045777","https://openalex.org/W2020472611","https://openalex.org/W2078714787","https://openalex.org/W2128808215","https://openalex.org/W2136528950","https://openalex.org/W2203825473","https://openalex.org/W2251986772","https://openalex.org/W2274323834","https://openalex.org/W6678961370","https://openalex.org/W6691516209","https://openalex.org/W7038540887"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2492617563","https://openalex.org/W2480261505","https://openalex.org/W4206388121","https://openalex.org/W2900572605","https://openalex.org/W2305719592","https://openalex.org/W2068143774","https://openalex.org/W4241525818","https://openalex.org/W2029097226","https://openalex.org/W2394613339"],"abstract_inverted_index":{"With":[0],"increased":[1,27],"penetration":[2],"of":[3,29,40,63,98,100,147],"smart":[4],"devices":[5],"and":[6,20,53,78,120,127,149,167,191],"internet":[7],"connectivity,":[8],"many":[9,102],"Thais":[10],"are":[11,47,60,125,188],"more":[12],"readily":[13],"engaged":[14],"in":[15,43,76,86,118,141],"social":[16,30,104,115,164],"media,":[17],"online":[18,138],"forums,":[19],"chat":[21],"groups.":[22],"As":[23,89,123],"there":[24,33],"is":[25,34,82,109,132],"an":[26,137,155],"consumption":[28,39],"media":[31,58,105,116,165],"content,":[32],"a":[35,61,170],"shift":[36],"from":[37],"the":[38,64,90,112,145],"traditional":[41,54],"medias":[42],"which":[44,81,142],"formal":[45],"language":[46,80],"used":[48],"regularly":[49],"such":[50],"as":[51],"broadcast":[52],"print":[55],"medias.":[56],"Social":[57],"posts":[59,67,166],"reflection":[62],"trend,":[65],"where":[66],"usually":[68,73,133],"made":[69],"by":[70,162,181],"younger":[71],"generations":[72],"involve":[74],"communication":[75],"slang":[77,119,124,161,193],"non-formal":[79],"not":[83],"typically":[84],"available":[85],"formalized":[87],"dictionaries.":[88],"Thai":[91,103,160],"population":[92],"like":[93],"to":[94,110,135,174,185],"follow":[95,111],"trends,":[96],"one":[97],"behaviors":[99],"that":[101,157],"users":[106],"engage":[107],"in,":[108],"latest":[113],"popular":[114,150,159,192],"trends":[117,146],"word":[121],"usage.":[122],"changed":[126],"evolved":[128],"over":[129],"time,":[130],"it":[131,180],"useful":[134],"have":[136],"mining":[139],"tool":[140],"could":[143],"capture":[144],"emerging":[148],"slang.":[151],"This":[152],"paper":[153],"proposes":[154],"approach":[156,173,184],"extracts":[158],"comparing":[163],"utilizing":[168],"tokenization,":[169],"dictionary":[171],"based":[172],"extract":[175],"unknown":[176],"words,":[177],"before":[178],"expanding":[179],"using":[182],"n-gram":[183],"figure":[186],"what":[187],"currently":[189],"trending":[190],"words.":[194]},"counts_by_year":[{"year":2023,"cited_by_count":3},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
