{"id":"https://openalex.org/W3035362865","doi":"https://doi.org/10.1142/s2196888820500207","title":"New Descriptors of Textual Records: Getting Help from Frequent Itemsets","display_name":"New Descriptors of Textual Records: Getting Help from Frequent Itemsets","publication_year":2020,"publication_date":"2020-06-08","ids":{"openalex":"https://openalex.org/W3035362865","doi":"https://doi.org/10.1142/s2196888820500207","mag":"3035362865"},"language":"en","primary_location":{"id":"doi:10.1142/s2196888820500207","is_oa":true,"landing_page_url":"https://doi.org/10.1142/s2196888820500207","pdf_url":null,"source":{"id":"https://openalex.org/S2486636169","display_name":"Vietnam Journal of Computer Science","issn_l":"2196-8888","issn":["2196-8888","2196-8896"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Vietnam Journal of Computer Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1142/s2196888820500207","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057517985","display_name":"Ayoub Bokhabrine","orcid":null},"institutions":[{"id":"https://openalex.org/I63341726","display_name":"Universit\u00e9 du Qu\u00e9bec \u00e0 Trois-Rivi\u00e8res","ror":"https://ror.org/02xrw9r68","country_code":"CA","type":"education","lineage":["https://openalex.org/I49663120","https://openalex.org/I63341726"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Ayoub Bokhabrine","raw_affiliation_strings":["D\u00e9partement de math\u00e9matiques et d\u2019informatique, Universit\u00e9 du Qu\u00e9bec \u00e0 Trois-Rivi\u00e8res, 3351 boulevard des forges, Trois-Rivi\u00e8res, Qu\u00e9bec G8Z 4M3, Canada"],"affiliations":[{"raw_affiliation_string":"D\u00e9partement de math\u00e9matiques et d\u2019informatique, Universit\u00e9 du Qu\u00e9bec \u00e0 Trois-Rivi\u00e8res, 3351 boulevard des forges, Trois-Rivi\u00e8res, Qu\u00e9bec G8Z 4M3, Canada","institution_ids":["https://openalex.org/I63341726"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087659866","display_name":"Isma\u00efl Biskri","orcid":"https://orcid.org/0000-0002-7644-5810"},"institutions":[{"id":"https://openalex.org/I63341726","display_name":"Universit\u00e9 du Qu\u00e9bec \u00e0 Trois-Rivi\u00e8res","ror":"https://ror.org/02xrw9r68","country_code":"CA","type":"education","lineage":["https://openalex.org/I49663120","https://openalex.org/I63341726"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Isma\u00efl Biskri","raw_affiliation_strings":["D\u00e9partement de math\u00e9matiques et d\u2019informatique, Universit\u00e9 du Qu\u00e9bec \u00e0 Trois-Rivi\u00e8res, 3351 boulevard des forges, Trois-Rivi\u00e8res, Qu\u00e9bec G8Z 4M3, Canada"],"affiliations":[{"raw_affiliation_string":"D\u00e9partement de math\u00e9matiques et d\u2019informatique, Universit\u00e9 du Qu\u00e9bec \u00e0 Trois-Rivi\u00e8res, 3351 boulevard des forges, Trois-Rivi\u00e8res, Qu\u00e9bec G8Z 4M3, Canada","institution_ids":["https://openalex.org/I63341726"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063145283","display_name":"Nadia Ghazzali","orcid":null},"institutions":[{"id":"https://openalex.org/I63341726","display_name":"Universit\u00e9 du Qu\u00e9bec \u00e0 Trois-Rivi\u00e8res","ror":"https://ror.org/02xrw9r68","country_code":"CA","type":"education","lineage":["https://openalex.org/I49663120","https://openalex.org/I63341726"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Nadia Ghazzali","raw_affiliation_strings":["D\u00e9partement de math\u00e9matiques et d\u2019informatique, Universit\u00e9 du Qu\u00e9bec \u00e0 Trois-Rivi\u00e8res, 3351 boulevard des forges, Trois-Rivi\u00e8res, Qu\u00e9bec G8Z 4M3, Canada"],"affiliations":[{"raw_affiliation_string":"D\u00e9partement de math\u00e9matiques et d\u2019informatique, Universit\u00e9 du Qu\u00e9bec \u00e0 Trois-Rivi\u00e8res, 3351 boulevard des forges, Trois-Rivi\u00e8res, Qu\u00e9bec G8Z 4M3, Canada","institution_ids":["https://openalex.org/I63341726"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5087659866"],"corresponding_institution_ids":["https://openalex.org/I63341726"],"apc_list":null,"apc_paid":null,"fwci":0.8007,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.79746758,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"07","issue":"04","first_page":"355","last_page":"372"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11063","display_name":"Rough Sets and Fuzzy Logic","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9873999953269958,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7794299125671387},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6911890506744385},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.6408068537712097},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.6125479936599731},{"id":"https://openalex.org/keywords/medoid","display_name":"Medoid","score":0.6082904934883118},{"id":"https://openalex.org/keywords/keyword-extraction","display_name":"Keyword extraction","score":0.5401995778083801},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.531057596206665},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5270215272903442},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5158399939537048},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4573456943035126},{"id":"https://openalex.org/keywords/raw-data","display_name":"Raw data","score":0.4506545066833496},{"id":"https://openalex.org/keywords/document-clustering","display_name":"Document clustering","score":0.4380396902561188},{"id":"https://openalex.org/keywords/association-rule-learning","display_name":"Association rule learning","score":0.4195675849914551},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32215559482574463}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7794299125671387},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6911890506744385},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.6408068537712097},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.6125479936599731},{"id":"https://openalex.org/C63085389","wikidata":"https://www.wikidata.org/wiki/Q4287912","display_name":"Medoid","level":3,"score":0.6082904934883118},{"id":"https://openalex.org/C2780288562","wikidata":"https://www.wikidata.org/wiki/Q25053353","display_name":"Keyword extraction","level":2,"score":0.5401995778083801},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.531057596206665},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5270215272903442},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5158399939537048},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4573456943035126},{"id":"https://openalex.org/C132964779","wikidata":"https://www.wikidata.org/wiki/Q2110223","display_name":"Raw data","level":2,"score":0.4506545066833496},{"id":"https://openalex.org/C177937566","wikidata":"https://www.wikidata.org/wiki/Q4223102","display_name":"Document clustering","level":3,"score":0.4380396902561188},{"id":"https://openalex.org/C193524817","wikidata":"https://www.wikidata.org/wiki/Q386780","display_name":"Association rule learning","level":2,"score":0.4195675849914551},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32215559482574463},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1142/s2196888820500207","is_oa":true,"landing_page_url":"https://doi.org/10.1142/s2196888820500207","pdf_url":null,"source":{"id":"https://openalex.org/S2486636169","display_name":"Vietnam Journal of Computer Science","issn_l":"2196-8888","issn":["2196-8888","2196-8896"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Vietnam Journal of Computer Science","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:d70483ca74374d57bd9fb32cdcd25be3","is_oa":true,"landing_page_url":"https://doaj.org/article/d70483ca74374d57bd9fb32cdcd25be3","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Vietnam Journal of Computer Science, Vol 7, Iss 4, Pp 355-372 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1142/s2196888820500207","is_oa":true,"landing_page_url":"https://doi.org/10.1142/s2196888820500207","pdf_url":null,"source":{"id":"https://openalex.org/S2486636169","display_name":"Vietnam Journal of Computer Science","issn_l":"2196-8888","issn":["2196-8888","2196-8896"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Vietnam Journal of Computer Science","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.5600000023841858,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W1484413656","https://openalex.org/W1528447234","https://openalex.org/W1944603233","https://openalex.org/W2016381774","https://openalex.org/W2045407077","https://openalex.org/W2064853889","https://openalex.org/W2066277072","https://openalex.org/W2102297485","https://openalex.org/W2612904781","https://openalex.org/W2778860343","https://openalex.org/W2971324562","https://openalex.org/W4235526601"],"related_works":["https://openalex.org/W2014988084","https://openalex.org/W1671077962","https://openalex.org/W2074401349","https://openalex.org/W4293203576","https://openalex.org/W3082457728","https://openalex.org/W4306887032","https://openalex.org/W4237492828","https://openalex.org/W2562074663","https://openalex.org/W3011501242","https://openalex.org/W2025763381"],"abstract_inverted_index":{"The":[0,24,85],"analysis":[1],"of":[2,11,17,26,28,37,59,74,91],"numerical":[3],"data,":[4],"whether":[5],"structured,":[6],"semi-structured,":[7],"or":[8,20],"raw,":[9],"is":[10,31],"paramount":[12],"importance":[13],"in":[14,71],"many":[15],"sectors":[16],"economic,":[18],"scientific,":[19],"simply":[21],"social":[22],"activity.":[23],"process":[25],"extraction":[27],"association":[29],"rules":[30],"based":[32],"on":[33,41],"the":[34,38,42,47,69,89,92],"lexical":[35],"quality":[36],"text":[39],"and":[40,65,82],"minimum":[43],"support":[44],"set":[45],"by":[46],"user.":[48],"In":[49],"this":[50],"paper,":[51],"we":[52],"implemented":[53],"a":[54],"platform":[55],"named":[56],"\u201cIDETEX\u201d":[57],"capable":[58],"extracting":[60],"itemsets":[61],"from":[62],"textual":[63],"data":[64],"using":[66],"it":[67],"for":[68,95],"experimentation":[70],"different":[72],"types":[73],"clustering":[75],"methods,":[76],"such":[77],"as":[78],"[Formula:":[79],"see":[80],"text]-Medoids":[81],"Hierarchical":[83],"clustering.":[84],"experiments":[86],"conducted":[87],"demonstrate":[88],"potential":[90],"proposed":[93],"approach":[94],"defining":[96],"similarity":[97],"between":[98],"segments.":[99]},"counts_by_year":[{"year":2022,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
