{"id":"https://openalex.org/W3136188561","doi":"https://doi.org/10.4114/intartif.vol24iss67pp1-17","title":"Morphological Skip-Gram: Replacing FastText characters n-gram with morphological knowledge","display_name":"Morphological Skip-Gram: Replacing FastText characters n-gram with morphological knowledge","publication_year":2021,"publication_date":"2021-02-20","ids":{"openalex":"https://openalex.org/W3136188561","doi":"https://doi.org/10.4114/intartif.vol24iss67pp1-17","mag":"3136188561"},"language":"en","primary_location":{"id":"doi:10.4114/intartif.vol24iss67pp1-17","is_oa":true,"landing_page_url":"https://doi.org/10.4114/intartif.vol24iss67pp1-17","pdf_url":"http://journal.iberamia.org/index.php/intartif/article/download/588/139","source":{"id":"https://openalex.org/S4210203986","display_name":"INTELIGENCIA ARTIFICIAL","issn_l":"1137-3601","issn":["1137-3601","1988-3064"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310321681","host_organization_name":"Asociaci\u00f3n Espa\u00f1ola para la Inteligencia Artificial","host_organization_lineage":["https://openalex.org/P4310321681"],"host_organization_lineage_names":["Asociaci\u00f3n Espa\u00f1ola para la Inteligencia Artificial"],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Inteligencia Artificial","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"http://journal.iberamia.org/index.php/intartif/article/download/588/139","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5062021162","display_name":"Fl\u00e1vio Santos","orcid":"https://orcid.org/0000-0003-2378-5376"},"institutions":[{"id":"https://openalex.org/I25112270","display_name":"Universidade Federal de Pernambuco","ror":"https://ror.org/047908t24","country_code":"BR","type":"education","lineage":["https://openalex.org/I25112270"]}],"countries":["BR"],"is_corresponding":true,"raw_author_name":"Fl\u00e1vio Arthur O. Santos","raw_affiliation_strings":["Universidade Federal de Pernambuco, Centro de Informatica, Recife, Brazil"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universidade Federal de Pernambuco, Centro de Informatica, Recife, Brazil","institution_ids":["https://openalex.org/I25112270"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009574728","display_name":"Thiago Dias Bispo","orcid":"https://orcid.org/0000-0002-8588-0080"},"institutions":[{"id":"https://openalex.org/I25112270","display_name":"Universidade Federal de Pernambuco","ror":"https://ror.org/047908t24","country_code":"BR","type":"education","lineage":["https://openalex.org/I25112270"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Thiago Dias Bispo","raw_affiliation_strings":["Universidade Federal de Pernambuco, Centro de Informatica, Recife, Brazil"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universidade Federal de Pernambuco, Centro de Informatica, Recife, Brazil","institution_ids":["https://openalex.org/I25112270"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048968559","display_name":"Hendrik Macedo","orcid":"https://orcid.org/0000-0002-6477-756X"},"institutions":[{"id":"https://openalex.org/I190085865","display_name":"Universidade Federal de Sergipe","ror":"https://ror.org/028ka0n85","country_code":"BR","type":"education","lineage":["https://openalex.org/I190085865"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Hendrik Teixeira Macedo","raw_affiliation_strings":["Universidade Federal de Sergipe, Departamento de Computacao, Brazil"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universidade Federal de Sergipe, Departamento de Computacao, Brazil","institution_ids":["https://openalex.org/I190085865"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086345001","display_name":"Cleber Zanchettin","orcid":"https://orcid.org/0000-0001-6421-9747"},"institutions":[{"id":"https://openalex.org/I25112270","display_name":"Universidade Federal de Pernambuco","ror":"https://ror.org/047908t24","country_code":"BR","type":"education","lineage":["https://openalex.org/I25112270"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Cleber Zanchettin","raw_affiliation_strings":["Universidade Federal de Pernambuco, Centro de Informatica, Recife, Brazil"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universidade Federal de Pernambuco, Centro de Informatica, Recife, Brazil","institution_ids":["https://openalex.org/I25112270"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5062021162"],"corresponding_institution_ids":["https://openalex.org/I25112270"],"apc_list":null,"apc_paid":null,"fwci":0.6996,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.75348356,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"24","issue":"67","first_page":"1","last_page":"17"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.7898987531661987},{"id":"https://openalex.org/keywords/morpheme","display_name":"Morpheme","score":0.7115440368652344},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7089018225669861},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.694826066493988},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6713180541992188},{"id":"https://openalex.org/keywords/n-gram","display_name":"n-gram","score":0.5794331431388855},{"id":"https://openalex.org/keywords/word2vec","display_name":"Word2vec","score":0.5772584676742554},{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.5589425563812256},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.47015881538391113},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2292499542236328},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.21516773104667664}],"concepts":[{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.7898987531661987},{"id":"https://openalex.org/C165297611","wikidata":"https://www.wikidata.org/wiki/Q43249","display_name":"Morpheme","level":2,"score":0.7115440368652344},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7089018225669861},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.694826066493988},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6713180541992188},{"id":"https://openalex.org/C117884012","wikidata":"https://www.wikidata.org/wiki/Q94489","display_name":"n-gram","level":3,"score":0.5794331431388855},{"id":"https://openalex.org/C2776461190","wikidata":"https://www.wikidata.org/wiki/Q22673982","display_name":"Word2vec","level":3,"score":0.5772584676742554},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.5589425563812256},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.47015881538391113},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2292499542236328},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.21516773104667664},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.4114/intartif.vol24iss67pp1-17","is_oa":true,"landing_page_url":"https://doi.org/10.4114/intartif.vol24iss67pp1-17","pdf_url":"http://journal.iberamia.org/index.php/intartif/article/download/588/139","source":{"id":"https://openalex.org/S4210203986","display_name":"INTELIGENCIA ARTIFICIAL","issn_l":"1137-3601","issn":["1137-3601","1988-3064"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310321681","host_organization_name":"Asociaci\u00f3n Espa\u00f1ola para la Inteligencia Artificial","host_organization_lineage":["https://openalex.org/P4310321681"],"host_organization_lineage_names":["Asociaci\u00f3n Espa\u00f1ola para la Inteligencia Artificial"],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Inteligencia Artificial","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:7c2bcdd6ac834de2bc926bce27d42147","is_oa":true,"landing_page_url":"https://doaj.org/article/7c2bcdd6ac834de2bc926bce27d42147","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Inteligencia Artificial, Vol 24, Iss 67 (2021)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.4114/intartif.vol24iss67pp1-17","is_oa":true,"landing_page_url":"https://doi.org/10.4114/intartif.vol24iss67pp1-17","pdf_url":"http://journal.iberamia.org/index.php/intartif/article/download/588/139","source":{"id":"https://openalex.org/S4210203986","display_name":"INTELIGENCIA ARTIFICIAL","issn_l":"1137-3601","issn":["1137-3601","1988-3064"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310321681","host_organization_name":"Asociaci\u00f3n Espa\u00f1ola para la Inteligencia Artificial","host_organization_lineage":["https://openalex.org/P4310321681"],"host_organization_lineage_names":["Asociaci\u00f3n Espa\u00f1ola para la Inteligencia Artificial"],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Inteligencia Artificial","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2823776494","display_name":null,"funder_award_id":"88887","funder_id":"https://openalex.org/F4320321091","funder_display_name":"Coordena\u00e7\u00e3o de Aperfei\u00e7oamento de Pessoal de N\u00edvel Superior"},{"id":"https://openalex.org/G3527345606","display_name":null,"funder_award_id":"11/2016","funder_id":"https://openalex.org/F4320321091","funder_display_name":"Coordena\u00e7\u00e3o de Aperfei\u00e7oamento de Pessoal de N\u00edvel Superior"}],"funders":[{"id":"https://openalex.org/F4320321091","display_name":"Coordena\u00e7\u00e3o de Aperfei\u00e7oamento de Pessoal de N\u00edvel Superior","ror":"https://ror.org/00x0ma614"},{"id":"https://openalex.org/F4320322025","display_name":"Conselho Nacional de Desenvolvimento Cient\u00edfico e Tecnol\u00f3gico","ror":"https://ror.org/03swz6y49"},{"id":"https://openalex.org/F4320323353","display_name":"Funda\u00e7\u00e3o de Apoio \u00e0 Pesquisa e \u00e0 Inova\u00e7\u00e3o Tecnol\u00f3gica do Estado de Sergipe","ror":"https://ror.org/028ka0n85"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3136188561.pdf","grobid_xml":"https://content.openalex.org/works/W3136188561.grobid-xml"},"referenced_works_count":46,"referenced_works":["https://openalex.org/W1569415500","https://openalex.org/W1614298861","https://openalex.org/W1854884267","https://openalex.org/W2026487812","https://openalex.org/W2053921957","https://openalex.org/W2064675550","https://openalex.org/W2080100102","https://openalex.org/W2081580037","https://openalex.org/W2094728533","https://openalex.org/W2098801107","https://openalex.org/W2112184938","https://openalex.org/W2135964261","https://openalex.org/W2141599568","https://openalex.org/W2142377809","https://openalex.org/W2153579005","https://openalex.org/W2158899491","https://openalex.org/W2167949727","https://openalex.org/W2250539671","https://openalex.org/W2250618788","https://openalex.org/W2251012068","https://openalex.org/W2251044566","https://openalex.org/W2493916176","https://openalex.org/W2525778437","https://openalex.org/W2573169100","https://openalex.org/W2575842049","https://openalex.org/W2606342375","https://openalex.org/W2611669587","https://openalex.org/W2612675303","https://openalex.org/W2613977835","https://openalex.org/W2773621464","https://openalex.org/W2781491986","https://openalex.org/W2796547996","https://openalex.org/W2896457183","https://openalex.org/W2901215838","https://openalex.org/W2950577311","https://openalex.org/W2951714314","https://openalex.org/W2952230511","https://openalex.org/W2962739339","https://openalex.org/W2963341956","https://openalex.org/W3049711450","https://openalex.org/W3103061166","https://openalex.org/W4288287577","https://openalex.org/W4294170691","https://openalex.org/W4302027230","https://openalex.org/W4385245566","https://openalex.org/W4386506836"],"related_works":["https://openalex.org/W2905749112","https://openalex.org/W2346530426","https://openalex.org/W875474545","https://openalex.org/W3099354896","https://openalex.org/W2890749918","https://openalex.org/W4287599800","https://openalex.org/W2772765860","https://openalex.org/W4312264180","https://openalex.org/W4236073812","https://openalex.org/W3048777016"],"abstract_inverted_index":{"Natural":[0],"language":[1],"processing":[2],"systems":[3],"have":[4,166],"attracted":[5],"much":[6],"interest":[7],"of":[8,13,17,78,106,126,144,152,156,177,210,216,223],"the":[9,79,93,114,137,142,150,175,185,207,220,224,255,265,274,280],"industry.":[10],"This":[11,90,181],"branch":[12],"study":[14],"is":[15,141,159,204,268],"composed":[16],"some":[18,164],"applications":[19,46],"such":[20],"as":[21,49,123],"machine":[22,53],"translation,":[23],"sentiment":[24],"analysis,":[25],"named":[26],"entity":[27],"recognition,":[28],"question":[29],"and":[30,32,65,81,103,136,173,201,231,254,290],"answer,":[31],"others.":[33],"Word":[34],"embeddings":[35,62,95,117],"(i.e.,":[36],"continuous":[37,131],"word":[38,50,61,70,94,100,116,122,139,158,199,217],"representations)":[39],"are":[40,63,104,233],"an":[41],"essential":[42],"module":[43],"for":[44,87,197,213],"those":[45],"generally":[47],"used":[48],"representation":[51,85,140],"to":[52,59,205,238,262],"learning":[54],"models.":[55],"Some":[56],"popular":[57],"methods":[58],"train":[60],"GloVe":[64],"Word2Vec.":[66],"They":[67],"achieve":[68],"good":[69],"representations,":[71],"despite":[72],"limitations:":[73],"both":[74],"ignore":[75],"morphological":[76,221],"information":[77],"words":[80,172,227],"consider":[82,98],"only":[83],"one":[84],"vector":[86,132],"each":[88,121,134,239],"word.":[89,225],"approach":[91,162,182],"implies":[92],"does":[96],"not":[97],"different":[99,252,294],"contexts":[101],"properly":[102],"unaware":[105],"its":[107,145,202],"inner":[108],"structure.":[109],"To":[110,241],"mitigate":[111],"this":[112,190],"problem,":[113],"other":[115],"method":[118,196],"FastText":[119,208,272],"represents":[120],"a":[124,130,157,160,194,214,258],"bag":[125,209,215],"characters":[127,146],"n-grams.":[128],"Hence,":[129],"describes":[133],"n-gram,":[135],"final":[138],"sum":[143],"n-grams":[147,154,165,212],"vectors.":[148],"Nevertheless,":[149],"use":[151],"all":[153],"character":[155,211],"poor":[161],"since":[163],"no":[167],"semantic":[168],"relation":[169],"with":[170,228],"their":[171],"increase":[174,184],"amount":[176],"potentially":[178],"useless":[179],"information.":[180],"also":[183,278],"training":[186,198,275],"phase":[187],"time.":[188],"In":[189],"work,":[191],"we":[192,246],"propose":[193],"new":[195,244],"embeddings,":[200],"goal":[203],"replace":[206],"morphemes":[218,232],"through":[219,286],"analysis":[222],"Thus,":[226],"similar":[229],"context":[230],"represented":[234],"by":[235],"vectors":[236],"close":[237],"other.":[240],"evaluate":[242],"our":[243],"approach,":[245],"performed":[247],"intrinsic":[248],"evaluations":[249,285],"considering":[250],"15":[251],"tasks,":[253],"results":[256],"show":[257],"competitive":[259],"performance":[260],"compared":[261],"FastText.":[263],"Moreover,":[264],"proposed":[266],"model":[267],"$40\\%$":[269],"faster":[270],"than":[271],"in":[273,283],"phase.":[276],"We":[277],"outperform":[279],"baseline":[281],"approaches":[282],"extrinsic":[284],"Hate":[287],"speech":[288],"detection":[289],"NER":[291],"tasks":[292],"using":[293],"scenarios.":[295]},"counts_by_year":[{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
