{"id":"https://openalex.org/W3015144506","doi":"https://doi.org/10.1145/3380967","title":"Improving Code-mixed POS Tagging Using Code-mixed Embeddings","display_name":"Improving Code-mixed POS Tagging Using Code-mixed Embeddings","publication_year":2020,"publication_date":"2020-03-29","ids":{"openalex":"https://openalex.org/W3015144506","doi":"https://doi.org/10.1145/3380967","mag":"3015144506"},"language":"en","primary_location":{"id":"doi:10.1145/3380967","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3380967","pdf_url":null,"source":{"id":"https://openalex.org/S4306421405","display_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","issn_l":"2375-4699","issn":["2375-4699","2375-4702"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108784869","display_name":"S. Nagesh Bhattu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210153924","display_name":"National Institute of Technology Andhra Pradesh","ror":"https://ror.org/0456pcg54","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210153924"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"S. Nagesh Bhattu","raw_affiliation_strings":["National Institute of Technology Andhra Pradesh, Andhra Pradesh, India"],"affiliations":[{"raw_affiliation_string":"National Institute of Technology Andhra Pradesh, Andhra Pradesh, India","institution_ids":["https://openalex.org/I4210153924"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067954912","display_name":"Satya Krishna Nunna","orcid":"https://orcid.org/0000-0001-7827-8393"},"institutions":[{"id":"https://openalex.org/I4210153924","display_name":"National Institute of Technology Andhra Pradesh","ror":"https://ror.org/0456pcg54","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210153924"]},{"id":"https://openalex.org/I150312865","display_name":"Institute for Development and Research in Banking Technology","ror":"https://ror.org/00ta0g865","country_code":"IN","type":"government","lineage":["https://openalex.org/I150312865"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Satya Krishna Nunna","raw_affiliation_strings":["IDRBT and National Institute of Technology, Andhra Pradesh, India"],"affiliations":[{"raw_affiliation_string":"IDRBT and National Institute of Technology, Andhra Pradesh, India","institution_ids":["https://openalex.org/I150312865","https://openalex.org/I4210153924"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111965646","display_name":"D. V. L. N. Somayajulu","orcid":null},"institutions":[{"id":"https://openalex.org/I207223250","display_name":"Indian Institute of Information Technology Design and Manufacturing Jabalpur","ror":"https://ror.org/00gmd7q80","country_code":"IN","type":"education","lineage":["https://openalex.org/I207223250"]},{"id":"https://openalex.org/I121750182","display_name":"National Institute of Technology Warangal","ror":"https://ror.org/017ebfz38","country_code":"IN","type":"education","lineage":["https://openalex.org/I121750182"]},{"id":"https://openalex.org/I39244652","display_name":"Indian Institute of Information Technology, Design and Manufacturing, Kancheepuram","ror":"https://ror.org/023c9pb11","country_code":"IN","type":"education","lineage":["https://openalex.org/I39244652"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"D. V. L. N. Somayajulu","raw_affiliation_strings":["National Institute of Technology and IIITDMKL, Warangal, Andhra Pradesh, India"],"affiliations":[{"raw_affiliation_string":"National Institute of Technology and IIITDMKL, Warangal, Andhra Pradesh, India","institution_ids":["https://openalex.org/I121750182","https://openalex.org/I207223250","https://openalex.org/I39244652"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014324813","display_name":"Binay Pradhan","orcid":"https://orcid.org/0000-0002-6318-3241"},"institutions":[{"id":"https://openalex.org/I188963388","display_name":"International Institute of Information Technology","ror":"https://ror.org/02dernx73","country_code":"IN","type":"education","lineage":["https://openalex.org/I188963388"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Binay Pradhan","raw_affiliation_strings":["International Institute of Information Technology, Odisha, India"],"affiliations":[{"raw_affiliation_string":"International Institute of Information Technology, Odisha, India","institution_ids":["https://openalex.org/I188963388"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5108784869"],"corresponding_institution_ids":["https://openalex.org/I4210153924"],"apc_list":null,"apc_paid":null,"fwci":1.9204,"has_fulltext":false,"cited_by_count":25,"citation_normalized_percentile":{"value":0.88683884,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"19","issue":"4","first_page":"1","last_page":"31"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7840638756752014},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6298593282699585},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6228301525115967},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5952172875404358},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.5212855339050293},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4279952347278595},{"id":"https://openalex.org/keywords/code-mixing","display_name":"Code-mixing","score":0.41452616453170776},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.3641950488090515},{"id":"https://openalex.org/keywords/code-switching","display_name":"Code-switching","score":0.2735744118690491},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.233035147190094},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.19285327196121216}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7840638756752014},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6298593282699585},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6228301525115967},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5952172875404358},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.5212855339050293},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4279952347278595},{"id":"https://openalex.org/C2778598016","wikidata":"https://www.wikidata.org/wiki/Q3201279","display_name":"Code-mixing","level":3,"score":0.41452616453170776},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.3641950488090515},{"id":"https://openalex.org/C18552078","wikidata":"https://www.wikidata.org/wiki/Q255615","display_name":"Code-switching","level":2,"score":0.2735744118690491},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.233035147190094},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.19285327196121216},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3380967","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3380967","pdf_url":null,"source":{"id":"https://openalex.org/S4306421405","display_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","issn_l":"2375-4699","issn":["2375-4699","2375-4702"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7599999904632568}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W1524281572","https://openalex.org/W1538021842","https://openalex.org/W1631063262","https://openalex.org/W1783519389","https://openalex.org/W1977877104","https://openalex.org/W2041365579","https://openalex.org/W2064576795","https://openalex.org/W2064675550","https://openalex.org/W2071797522","https://openalex.org/W2105842272","https://openalex.org/W2116410915","https://openalex.org/W2117130368","https://openalex.org/W2121227244","https://openalex.org/W2121407024","https://openalex.org/W2131774270","https://openalex.org/W2139645402","https://openalex.org/W2139885235","https://openalex.org/W2150155583","https://openalex.org/W2219211395","https://openalex.org/W2236357521","https://openalex.org/W2250539671","https://openalex.org/W2250548009","https://openalex.org/W2251161416","https://openalex.org/W2251559320","https://openalex.org/W2251678408","https://openalex.org/W2251843872","https://openalex.org/W2296283641","https://openalex.org/W2343954916","https://openalex.org/W2423413767","https://openalex.org/W2493916176","https://openalex.org/W2560674852","https://openalex.org/W2560970694","https://openalex.org/W2561042415","https://openalex.org/W2743040064","https://openalex.org/W2750779823","https://openalex.org/W2778360819","https://openalex.org/W2784050058","https://openalex.org/W2796103437","https://openalex.org/W2798348125","https://openalex.org/W2891252302","https://openalex.org/W2952594430","https://openalex.org/W2955750298","https://openalex.org/W2963625095","https://openalex.org/W2963687836","https://openalex.org/W2964266863","https://openalex.org/W4205807230","https://openalex.org/W4237155282","https://openalex.org/W4302411445"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W4390411868","https://openalex.org/W2734357165","https://openalex.org/W2794189087","https://openalex.org/W2946888518","https://openalex.org/W143242002","https://openalex.org/W2264886721","https://openalex.org/W1960112736","https://openalex.org/W4226263902","https://openalex.org/W2800058963"],"abstract_inverted_index":{"Social":[0],"media":[1,16,36,72],"data":[2,89,165],"has":[3],"become":[4],"invaluable":[5],"component":[6],"of":[7,12,14,21,28,81,85,100,107,123,126,149,215,221,243,249,258,261,267,277],"business":[8],"analytics.":[9],"A":[10,255],"multitude":[11],"nuances":[13],"social":[15,35,71],"text":[17,23,29,74,119,139,175,191,226,245],"make":[18],"the":[19,49,55,98,105,121,170,219,259,275,286],"job":[20],"conventional":[22],"analytical":[24],"tools":[25],"difficult.":[26],"Code-mixing":[27],"is":[30,90,103,133,140,160,269,283],"a":[31,78,203,237],"phenomenon":[32],"prevalent":[33],"among":[34],"users,":[37],"wherein":[38],"words":[39,110,129],"used":[40,202],"are":[41],"borrowed":[42],"from":[43,117,251],"multiple":[44,95,150],"languages,":[45,300],"though":[46],"written":[47],"in":[48,94,130,168,224,294],"commonly":[50],"understood":[51],"roman":[52,131],"script.":[53],"All":[54],"existing":[56,253],"supervised":[57],"learning":[58,115],"methods":[59],"for":[60,69,137,176,183,189,194,240],"tasks":[61],"such":[62,86],"as":[63,120,142],"Parts":[64],"Of":[65],"Speech":[66],"(POS)":[67],"tagging":[68,136,143,223,242],"code-mixed":[70,138,174,190],"(CMSM)":[73],"typically":[75],"depend":[76],"on":[77,213],"large":[79,87],"amount":[80],"training":[82,88],"data.":[83],"Preparation":[84],"resource-intensive,":[91],"requiring":[92],"expertise":[93],"languages.":[96,151],"Though":[97],"preparation":[99],"small":[101],"dataset":[102],"possible,":[104],"out":[106],"vocabulary":[108],"(OOV)":[109],"pose":[111],"major":[112],"difficulty,":[113],"while":[114],"models":[116],"CMSM":[118,225,244],"number":[122],"different":[124],"ways":[125],"writing":[127],"non-native":[128],"script":[132],"huge.":[134],"POS":[135,177,222,241],"non-trivial,":[141],"should":[144],"deal":[145],"with":[146,209,264,280],"syntactic":[147],"rules":[148],"The":[152,271],"important":[153],"research":[154],"question":[155],"addressed":[156],"by":[157,173,227,246,289],"this":[158],"article":[159],"whether":[161],"abundantly":[162],"available":[163],"unlabeled":[164],"can":[166],"help":[167],"resolving":[169],"difficulties":[171],"posed":[172],"tagging.":[178],"We":[179,201,235],"develop":[180],"an":[181,252],"approach":[182,263,279],"scraping":[184],"and":[185,197,232,292,298],"building":[186],"word":[187,230],"embeddings":[188,282],"illustrating":[192],"it":[193,216],"Bengali-English,":[195],"Hindi-English,":[196],"Telugu-English":[198],"code-mixing":[199,268],"scenarios.":[200],"hierarchical":[204],"deep":[205],"recurrent":[206],"neural":[207],"network":[208],"linear-chain":[210],"CRF":[211],"layer":[212],"top":[214],"to":[217],"improve":[218],"performance":[220,260],"capturing":[228],"contextual":[229],"features":[231],"character-sequence\u2013based":[233],"information.":[234],"prepared":[236],"labeled":[238],"resource":[239],"correcting":[247],"19%":[248],"labels":[250],"resource.":[254],"detailed":[256],"analysis":[257],"our":[262,278],"varying":[265],"levels":[266],"provided.":[270],"results":[272],"indicate":[273],"that":[274],"F1-score":[276],"custom":[281],"better":[284],"than":[285],"CRF-based":[287],"baseline":[288],"5.81%,":[290],"5.69%,":[291],"6.3%":[293],"Bengali,":[295],"Hindi":[296],",":[297],"Telugu":[299],"respectively.":[301]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":5}],"updated_date":"2026-03-28T08:17:26.163206","created_date":"2025-10-10T00:00:00"}
