{"id":"https://openalex.org/W3098781046","doi":"https://doi.org/10.5220/0010109803500360","title":"Mining M-Grams by a Granular Computing Approach for Text Classification","display_name":"Mining M-Grams by a Granular Computing Approach for Text Classification","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3098781046","doi":"https://doi.org/10.5220/0010109803500360","mag":"3098781046"},"language":"en","primary_location":{"id":"doi:10.5220/0010109803500360","is_oa":false,"landing_page_url":"https://doi.org/10.5220/0010109803500360","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 12th International Joint Conference on Computational Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://hdl.handle.net/11573/1461477","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072229274","display_name":"Antonino Capillo","orcid":"https://orcid.org/0000-0002-6360-7737"},"institutions":[{"id":"https://openalex.org/I861853513","display_name":"Sapienza University of Rome","ror":"https://ror.org/02be6w209","country_code":"IT","type":"education","lineage":["https://openalex.org/I861853513"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Antonino Capillo","raw_affiliation_strings":["Department of Information Engineering, Electronics and Telecommunications, University of Rome \u201cLa Sapienza\u201d, Via Eudossiana 18, 00184 Rome, Italy, --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, Electronics and Telecommunications, University of Rome \u201cLa Sapienza\u201d, Via Eudossiana 18, 00184 Rome, Italy, --- Select a Country ---","institution_ids":["https://openalex.org/I861853513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020616232","display_name":"Enrico De Santis","orcid":"https://orcid.org/0000-0003-4915-0723"},"institutions":[{"id":"https://openalex.org/I861853513","display_name":"Sapienza University of Rome","ror":"https://ror.org/02be6w209","country_code":"IT","type":"education","lineage":["https://openalex.org/I861853513"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Enrico de Santis","raw_affiliation_strings":["Department of Information Engineering, Electronics and Telecommunications, University of Rome \u201cLa Sapienza\u201d, Via Eudossiana 18, 00184 Rome, Italy, --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, Electronics and Telecommunications, University of Rome \u201cLa Sapienza\u201d, Via Eudossiana 18, 00184 Rome, Italy, --- Select a Country ---","institution_ids":["https://openalex.org/I861853513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085653924","display_name":"Fabio Massimo Frattale Mascioli","orcid":"https://orcid.org/0000-0002-3748-5019"},"institutions":[{"id":"https://openalex.org/I861853513","display_name":"Sapienza University of Rome","ror":"https://ror.org/02be6w209","country_code":"IT","type":"education","lineage":["https://openalex.org/I861853513"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Fabio Mascioli","raw_affiliation_strings":["Department of Information Engineering, Electronics and Telecommunications, University of Rome \u201cLa Sapienza\u201d, Via Eudossiana 18, 00184 Rome, Italy, --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, Electronics and Telecommunications, University of Rome \u201cLa Sapienza\u201d, Via Eudossiana 18, 00184 Rome, Italy, --- Select a Country ---","institution_ids":["https://openalex.org/I861853513"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5025282612","display_name":"Antonello Rizzi","orcid":null},"institutions":[{"id":"https://openalex.org/I861853513","display_name":"Sapienza University of Rome","ror":"https://ror.org/02be6w209","country_code":"IT","type":"education","lineage":["https://openalex.org/I861853513"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Antonello Rizzi","raw_affiliation_strings":["Department of Information Engineering, Electronics and Telecommunications, University of Rome \u201cLa Sapienza\u201d, Via Eudossiana 18, 00184 Rome, Italy, --- Select a Country ---"],"affiliations":[{"raw_affiliation_string":"Department of Information Engineering, Electronics and Telecommunications, University of Rome \u201cLa Sapienza\u201d, Via Eudossiana 18, 00184 Rome, Italy, --- Select a Country ---","institution_ids":["https://openalex.org/I861853513"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5072229274"],"corresponding_institution_ids":["https://openalex.org/I861853513"],"apc_list":null,"apc_paid":null,"fwci":0.7036,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.7690906,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"350","last_page":"360"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11063","display_name":"Rough Sets and Fuzzy Logic","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11063","display_name":"Rough Sets and Fuzzy Logic","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9147999882698059,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11727","display_name":"Advanced Algebra and Logic","score":0.9133999943733215,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6783494353294373},{"id":"https://openalex.org/keywords/granular-computing","display_name":"Granular computing","score":0.44279745221138},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41531702876091003},{"id":"https://openalex.org/keywords/rough-set","display_name":"Rough set","score":0.10485997796058655}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6783494353294373},{"id":"https://openalex.org/C17209119","wikidata":"https://www.wikidata.org/wiki/Q5596712","display_name":"Granular computing","level":3,"score":0.44279745221138},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41531702876091003},{"id":"https://openalex.org/C111012933","wikidata":"https://www.wikidata.org/wiki/Q3137210","display_name":"Rough set","level":2,"score":0.10485997796058655}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.5220/0010109803500360","is_oa":false,"landing_page_url":"https://doi.org/10.5220/0010109803500360","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 12th International Joint Conference on Computational Intelligence","raw_type":"proceedings-article"},{"id":"pmh:oai:iris.uniroma1.it:11573/1461477","is_oa":true,"landing_page_url":"http://hdl.handle.net/11573/1461477","pdf_url":null,"source":{"id":"https://openalex.org/S4377196107","display_name":"IRIS Research product catalog (Sapienza University of Rome)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":{"id":"pmh:oai:iris.uniroma1.it:11573/1461477","is_oa":true,"landing_page_url":"http://hdl.handle.net/11573/1461477","pdf_url":null,"source":{"id":"https://openalex.org/S4377196107","display_name":"IRIS Research product catalog (Sapienza University of Rome)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2350522004","https://openalex.org/W2370755174","https://openalex.org/W2377101006","https://openalex.org/W2187139637","https://openalex.org/W2350247864","https://openalex.org/W2112263672","https://openalex.org/W3013364385","https://openalex.org/W1795409297","https://openalex.org/W4299125407"],"abstract_inverted_index":{"Text":[0],"mining":[1],"and":[2,8,90,122,223],"text":[3,48],"classification":[4,21,153,222],"are":[5,17,56,71,120],"gaining":[6],"more":[7,9],"importance":[10],"in":[11,86,134,139,159,194],"AI":[12,203],"related":[13],"research":[14],"fields.":[15],"Researchers":[16],"particularly":[18],"focused":[19],"on":[20,24,96,219],"systems,":[22],"based":[23],"structured":[25],"data":[26],"(such":[27],"as":[28,145],"sequences":[29],"or":[30,62],"graphs),":[31],"facing":[32],"the":[33,75,97,111,116,152,197,208],"challenge":[34],"of":[35,65,118,161,200,207,217],"synthesizing":[36],"interpretable":[37],"models,":[38],"exploiting":[39],"gray-box":[40,47],"approaches.":[41],"In":[42],"this":[43],"paper,":[44],"a":[45,87,91,108,125,135,141,215],"novel":[46],"classifier":[49],"is":[50,84,100,158,166],"presented.":[51],"Documents":[52],"to":[53,103,168],"be":[54,185],"classified":[55],"split":[57],"into":[58,124],"their":[59],"constituent":[60],"words,":[61],"tokens.":[63],"Groups":[64],"frequent":[66],"m":[67],"tokens":[68],"(or":[69],"m-grams)":[70],"suitably":[72],"mined":[73],"adopting":[74],"Granular":[76],"Computing":[77],"framework.":[78],"By":[79],"fastText":[80],"algorithm,":[81],"each":[82,177],"token":[83],"encoded":[85],"real-valued":[88,137],"vector":[89],"custom-based":[92],"dissimilarity":[93],"measure,":[94],"grounded":[95],"Edit":[98],"family,":[99],"designed":[101],"specifically":[102],"deal":[104],"with":[105,151,196],"m-grams.":[106],"Through":[107],"clustering":[109],"procedure":[110],"most":[112,170],"representative":[113],"m-grams,":[114],"pertaining":[115],"corpus":[117],"documents,":[119],"extrapolated":[121],"arranged":[123],"Symbolic":[126],"Histogram":[127],"representation.":[128],"The":[129,205],"latter":[130],"allows":[131],"embedding":[132],"documents":[133],"well-suited":[136],"space":[138],"which":[140,165],"standard":[142],"classifier,":[143],"such":[144],"SVM,":[146],"can":[147,184],"safety":[148],"operate.":[149],"Along":[150],"procedure,":[154,193],"an":[155,189],"Evolutionary":[156],"Algorithm":[157],"charge":[160],"performing":[162],"features":[163],"selection,":[164],"able":[167],"select":[169],"relevant":[171],"symbols":[172,183],"\u2013":[173,175],"m-grams":[174],"for":[176],"class.":[178],"This":[179],"study":[180],"shows":[181],"how":[182],"fruitfully":[186],"interpreted,":[187],"allowing":[188],"interesting":[190],"knowledge":[191],"discovery":[192],"lights":[195],"new":[198],"requirements":[199],"modern":[201],"explainable":[202],"systems.":[204],"effectiveness":[206],"proposed":[209],"algorithm":[210],"has":[211],"been":[212],"proved":[213],"through":[214],"set":[216],"experiments":[218],"paper":[220],"abstracts":[221],"SMS":[224],"spam":[225],"detection.":[226]},"counts_by_year":[{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
