{"id":"https://openalex.org/W4321089622","doi":"https://doi.org/10.1145/3582496","title":"Semantic Tagging for the Urdu Language: Annotated Corpus and Multi-Target Classification Methods","display_name":"Semantic Tagging for the Urdu Language: Annotated Corpus and Multi-Target Classification Methods","publication_year":2023,"publication_date":"2023-02-16","ids":{"openalex":"https://openalex.org/W4321089622","doi":"https://doi.org/10.1145/3582496"},"language":"en","primary_location":{"id":"doi:10.1145/3582496","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3582496","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3582496","source":{"id":"https://openalex.org/S4306421405","display_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","issn_l":"2375-4699","issn":["2375-4699","2375-4702"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3582496","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075488653","display_name":"Jawad Shafi","orcid":"https://orcid.org/0000-0001-6427-3823"},"institutions":[{"id":"https://openalex.org/I67415387","display_name":"Lancaster University","ror":"https://ror.org/04f2nsd36","country_code":"GB","type":"education","lineage":["https://openalex.org/I67415387"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Jawad Shafi","raw_affiliation_strings":["Department of Computer Science, COMSATS University Islamabad, Lahore Campus, and InfoLab21, Lancaster University, Lancaster, U.K"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, COMSATS University Islamabad, Lahore Campus, and InfoLab21, Lancaster University, Lancaster, U.K","institution_ids":["https://openalex.org/I67415387"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005027058","display_name":"Rao Muhammad Adeel Nawab","orcid":"https://orcid.org/0000-0002-1765-8904"},"institutions":[{"id":"https://openalex.org/I16076960","display_name":"COMSATS University Islamabad","ror":"https://ror.org/00nqqvk19","country_code":"PK","type":"education","lineage":["https://openalex.org/I16076960"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Rao Muhammad Adeel Nawab","raw_affiliation_strings":["Department of Computer Science, COMSATS UniversityIslamabad, Lahore Campus, Pakistan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, COMSATS UniversityIslamabad, Lahore Campus, Pakistan","institution_ids":["https://openalex.org/I16076960"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058785189","display_name":"Paul Rayson","orcid":"https://orcid.org/0000-0002-1257-2191"},"institutions":[{"id":"https://openalex.org/I67415387","display_name":"Lancaster University","ror":"https://ror.org/04f2nsd36","country_code":"GB","type":"education","lineage":["https://openalex.org/I67415387"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Paul Rayson","raw_affiliation_strings":["School of Computing and Communications, InfoLab21, Lancaster University, Lancaster, U.K"],"affiliations":[{"raw_affiliation_string":"School of Computing and Communications, InfoLab21, Lancaster University, Lancaster, U.K","institution_ids":["https://openalex.org/I67415387"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5075488653"],"corresponding_institution_ids":["https://openalex.org/I67415387"],"apc_list":null,"apc_paid":null,"fwci":1.5629,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.85764795,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"22","issue":"6","first_page":"1","last_page":"32"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8631802797317505},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.7803627252578735},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6732789278030396},{"id":"https://openalex.org/keywords/explicit-semantic-analysis","display_name":"Explicit semantic analysis","score":0.5353530049324036},{"id":"https://openalex.org/keywords/semantic-computing","display_name":"Semantic computing","score":0.5117821097373962},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.47627466917037964},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.42709171772003174},{"id":"https://openalex.org/keywords/semantic-role-labeling","display_name":"Semantic role labeling","score":0.4208371341228485},{"id":"https://openalex.org/keywords/semeval","display_name":"SemEval","score":0.41242778301239014},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3807670474052429},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.36541202664375305},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.22981411218643188},{"id":"https://openalex.org/keywords/semantic-technology","display_name":"Semantic technology","score":0.226179838180542},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.13655179738998413}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8631802797317505},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7803627252578735},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6732789278030396},{"id":"https://openalex.org/C173862523","wikidata":"https://www.wikidata.org/wiki/Q5421270","display_name":"Explicit semantic analysis","level":5,"score":0.5353530049324036},{"id":"https://openalex.org/C511149849","wikidata":"https://www.wikidata.org/wiki/Q7449051","display_name":"Semantic computing","level":3,"score":0.5117821097373962},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.47627466917037964},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.42709171772003174},{"id":"https://openalex.org/C67277372","wikidata":"https://www.wikidata.org/wiki/Q7449085","display_name":"Semantic role labeling","level":3,"score":0.4208371341228485},{"id":"https://openalex.org/C44572571","wikidata":"https://www.wikidata.org/wiki/Q7448970","display_name":"SemEval","level":3,"score":0.41242778301239014},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3807670474052429},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.36541202664375305},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.22981411218643188},{"id":"https://openalex.org/C6881194","wikidata":"https://www.wikidata.org/wiki/Q7449091","display_name":"Semantic technology","level":4,"score":0.226179838180542},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.13655179738998413},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3582496","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3582496","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3582496","source":{"id":"https://openalex.org/S4306421405","display_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","issn_l":"2375-4699","issn":["2375-4699","2375-4702"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","raw_type":"journal-article"},{"id":"pmh:oai:eprints.lancs.ac.uk:199811","is_oa":true,"landing_page_url":null,"pdf_url":"https://eprints.lancs.ac.uk/id/eprint/199811/1/3582496_1_.pdf","source":{"id":"https://openalex.org/S4306401916","display_name":"Lancaster EPrints (Lancaster University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67415387","host_organization_name":"Lancaster University","host_organization_lineage":["https://openalex.org/I67415387"],"host_organization_lineage_names":[],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"}],"best_oa_location":{"id":"doi:10.1145/3582496","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3582496","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3582496","source":{"id":"https://openalex.org/S4306421405","display_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","issn_l":"2375-4699","issn":["2375-4699","2375-4702"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.7900000214576721,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320314731","display_name":"UK Research and Innovation","ror":"https://ror.org/001aqnf71"},{"id":"https://openalex.org/F4320334322","display_name":"HORIZON EUROPE Framework Programme","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4321089622.pdf","grobid_xml":"https://content.openalex.org/works/W4321089622.grobid-xml"},"referenced_works_count":75,"referenced_works":["https://openalex.org/W21766150","https://openalex.org/W22182018","https://openalex.org/W173369501","https://openalex.org/W342998476","https://openalex.org/W1486097837","https://openalex.org/W1495836335","https://openalex.org/W1498990157","https://openalex.org/W1524281572","https://openalex.org/W1551268210","https://openalex.org/W1555354714","https://openalex.org/W1555414055","https://openalex.org/W1594112393","https://openalex.org/W1596967103","https://openalex.org/W1787860060","https://openalex.org/W1795234945","https://openalex.org/W1880262756","https://openalex.org/W1967542092","https://openalex.org/W1977109256","https://openalex.org/W1977182536","https://openalex.org/W1985912861","https://openalex.org/W1994180792","https://openalex.org/W1999954155","https://openalex.org/W2005329858","https://openalex.org/W2006462052","https://openalex.org/W2029517229","https://openalex.org/W2054460891","https://openalex.org/W2058349743","https://openalex.org/W2077656994","https://openalex.org/W2100495367","https://openalex.org/W2101837219","https://openalex.org/W2102381086","https://openalex.org/W2114315281","https://openalex.org/W2116555906","https://openalex.org/W2119656664","https://openalex.org/W2120699290","https://openalex.org/W2127293965","https://openalex.org/W2127358574","https://openalex.org/W2128354940","https://openalex.org/W2129906471","https://openalex.org/W2156468487","https://openalex.org/W2159882563","https://openalex.org/W2325637306","https://openalex.org/W2398778769","https://openalex.org/W2428981601","https://openalex.org/W2436001372","https://openalex.org/W2483327705","https://openalex.org/W2531638282","https://openalex.org/W2534494861","https://openalex.org/W2560656125","https://openalex.org/W2608239929","https://openalex.org/W2614261290","https://openalex.org/W2614673973","https://openalex.org/W2676554382","https://openalex.org/W2715319929","https://openalex.org/W2771576526","https://openalex.org/W2809755228","https://openalex.org/W2891165828","https://openalex.org/W2901223329","https://openalex.org/W2903296288","https://openalex.org/W2936459239","https://openalex.org/W3002035509","https://openalex.org/W3124063403","https://openalex.org/W4206707056","https://openalex.org/W4211125870","https://openalex.org/W4229966930","https://openalex.org/W4242626930","https://openalex.org/W4244355702","https://openalex.org/W4294214983","https://openalex.org/W4296468769","https://openalex.org/W4365799834","https://openalex.org/W4389014815","https://openalex.org/W6611626601","https://openalex.org/W6629012200","https://openalex.org/W6756184450","https://openalex.org/W7010502027"],"related_works":["https://openalex.org/W2103835134","https://openalex.org/W1965623300","https://openalex.org/W3134365128","https://openalex.org/W2359259132","https://openalex.org/W3016822073","https://openalex.org/W2807098362","https://openalex.org/W2774861092","https://openalex.org/W2114077504","https://openalex.org/W4376876329","https://openalex.org/W2032956642"],"abstract_inverted_index":{"Extracting":[0],"and":[1,27,38,70,79,112,116,136,156,172,199,218,254,299,310,317,339],"analysing":[2],"meaning-related":[3],"information":[4,25,36],"from":[5,108,313],"natural":[6,20],"language":[7,21,44,269],"data":[8,28,45],"has":[9,209,247],"attracted":[10],"the":[11,41,90,94,149,159,175,180,190,222,268,276,297,314],"attention":[12],"of":[13,33,43,62,86,144,235,267,278,301,330],"researchers":[14],"in":[15,89,189,243],"various":[16,60,127],"fields,":[17],"such":[18,34],"as":[19,104,281],"processing,":[22],"corpus":[23,171,185,208,246,292,316,335],"linguistics,":[24],"retrieval,":[26],"science.":[29],"An":[30],"important":[31],"aspect":[32],"automatic":[35],"extraction":[37],"analysis":[39,266],"is":[40,93,141,153,337],"annotation":[42],"using":[46],"semantic":[47,51,63,80,128,176,216,228,236,258,265,279,303,311],"tagging":[48,52,129,177,280,304],"tools.":[49],"Different":[50],"tools":[53],"have":[54,123],"been":[55,124,210,248],"designed":[56],"to":[57,84,110,256,261,274,324,342],"carry":[58],"out":[59],"levels":[61],"analysis,":[64,73,78],"for":[65,96,126,134,148,174,179,238,296],"instance,":[66],"named":[67],"entity":[68],"recognition":[69],"disambiguation,":[71,76],"sentiment":[72],"word":[74,115,242],"sense":[75,118],"content":[77],"role":[81],"labelling.":[82],"Common":[83],"all":[85],"these":[87],"tasks,":[88,130],"supervised":[91,283,321],"setting,":[92],"requirement":[95],"a":[97,105,142,168,232,263,282],"manually":[98,211],"semantically":[99,145],"annotated":[100,146,212,249],"corpus,":[101],"which":[102,109,152,230,271,336],"acts":[103],"knowledge":[106],"base":[107],"train":[111],"test":[113],"potential":[114],"phrase-level":[117],"annotations.":[119],"Many":[120],"benchmark":[121,170],"corpora":[122,147],"developed":[125],"but":[131],"most":[132],"are":[133],"English":[135],"other":[137],"European":[138],"languages.":[139],"There":[140],"dearth":[143],"Urdu":[150,181,302],"language,":[151],"widely":[154],"spoken":[155],"used":[157,295],"around":[158],"world.":[160],"To":[161,287],"fill":[162],"this":[163,165],"gap,":[164],"study":[166],"presents":[167],"large":[169],"methods":[173],"task":[178],"language.":[182],"The":[183,207],"proposed":[184,245,291,315,334],"contains":[186],"8,000":[187],"tokens":[188],"following":[191],"domains":[192],"or":[193],"genres:":[194],"news,":[195],"social":[196],"media,":[197],"Wikipedia,":[198],"historical":[200],"text":[201],"(each":[202],"domain":[203],"having":[204],"2K":[205],"tokens).":[206],"with":[213,221,250],"21":[214],"major":[215],"fields":[217,237],"232":[219],"sub-fields":[220],"USAS":[223],"(UCREL":[224],"Semantic":[225],"Analysis":[226],"System)":[227],"taxonomy":[229],"provides":[231],"comprehensive":[233],"set":[234],"coarse-grained":[239],"annotation.":[240],"Each":[241],"our":[244,290,333],"at":[251],"least":[252],"one":[253],"up":[255],"nine":[257],"field":[259],"tags":[260],"provide":[262],"detailed":[264],"data,":[270],"allowed":[272],"us":[273],"treat":[275],"problem":[277],"multi-target":[284,322],"classification":[285],"task.":[286],"demonstrate":[288],"how":[289],"can":[293],"be":[294],"development":[298],"evaluation":[300],"methods,":[305],"we":[306],"extracted":[307],"local,":[308],"topical":[309],"features":[312],"applied":[318],"seven":[319],"different":[320],"classifiers":[323],"them.":[325],"Results":[326],"show":[327],"an":[328],"accuracy":[329],"94%":[331],"on":[332],"free":[338],"publicly":[340],"available":[341],"download.":[343]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":3}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
