{"id":"https://openalex.org/W2809000540","doi":"https://doi.org/10.1145/3206098.3206099","title":"A new text representation method for clustering based on higher order Markov model","display_name":"A new text representation method for clustering based on higher order Markov model","publication_year":2018,"publication_date":"2018-04-09","ids":{"openalex":"https://openalex.org/W2809000540","doi":"https://doi.org/10.1145/3206098.3206099","mag":"2809000540"},"language":"en","primary_location":{"id":"doi:10.1145/3206098.3206099","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3206098.3206099","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd International Conference on Information System and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101481133","display_name":"Weifeng Yang","orcid":"https://orcid.org/0000-0002-4833-7185"},"institutions":[{"id":"https://openalex.org/I27688046","display_name":"Hunan Institute of Engineering","ror":"https://ror.org/03zj2rn70","country_code":"CN","type":"education","lineage":["https://openalex.org/I27688046"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weifeng Yang","raw_affiliation_strings":["College of Science, Hunan Institute of Engineering, Xiangtan City, China"],"affiliations":[{"raw_affiliation_string":"College of Science, Hunan Institute of Engineering, Xiangtan City, China","institution_ids":["https://openalex.org/I27688046"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062084611","display_name":"Guosheng Han","orcid":"https://orcid.org/0000-0002-7712-6213"},"institutions":[{"id":"https://openalex.org/I4610292","display_name":"Xiangtan University","ror":"https://ror.org/00xsfaz62","country_code":"CN","type":"education","lineage":["https://openalex.org/I4610292"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guosheng Han","raw_affiliation_strings":["Key Laboratory of Intelligent Computing &amp; Information Processing of Ministry of Education, Xiangtan University, Xiangtan City, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Intelligent Computing &amp; Information Processing of Ministry of Education, Xiangtan University, Xiangtan City, China","institution_ids":["https://openalex.org/I4610292"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100991403","display_name":"Xiaoqiang Xie","orcid":null},"institutions":[{"id":"https://openalex.org/I27688046","display_name":"Hunan Institute of Engineering","ror":"https://ror.org/03zj2rn70","country_code":"CN","type":"education","lineage":["https://openalex.org/I27688046"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoqiang Xie","raw_affiliation_strings":["College of Science, Hunan Institute of Engineering, Xiangtan City, China"],"affiliations":[{"raw_affiliation_string":"College of Science, Hunan Institute of Engineering, Xiangtan City, China","institution_ids":["https://openalex.org/I27688046"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101481133"],"corresponding_institution_ids":["https://openalex.org/I27688046"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.06917592,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11063","display_name":"Rough Sets and Fuzzy Logic","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.7047541737556458},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6545741558074951},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5845326781272888},{"id":"https://openalex.org/keywords/markov-model","display_name":"Markov model","score":0.5672498941421509},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5185157060623169},{"id":"https://openalex.org/keywords/maximum-entropy-markov-model","display_name":"Maximum-entropy Markov model","score":0.48648616671562195},{"id":"https://openalex.org/keywords/variable-order-markov-model","display_name":"Variable-order Markov model","score":0.47147420048713684},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.46962881088256836},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.41979148983955383},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4144544303417206},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.31031686067581177},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.23495405912399292},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.14824241399765015}],"concepts":[{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.7047541737556458},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6545741558074951},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5845326781272888},{"id":"https://openalex.org/C163836022","wikidata":"https://www.wikidata.org/wiki/Q6771326","display_name":"Markov model","level":3,"score":0.5672498941421509},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5185157060623169},{"id":"https://openalex.org/C196956702","wikidata":"https://www.wikidata.org/wiki/Q6795829","display_name":"Maximum-entropy Markov model","level":5,"score":0.48648616671562195},{"id":"https://openalex.org/C54907487","wikidata":"https://www.wikidata.org/wiki/Q7915688","display_name":"Variable-order Markov model","level":4,"score":0.47147420048713684},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.46962881088256836},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.41979148983955383},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4144544303417206},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.31031686067581177},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.23495405912399292},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.14824241399765015},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3206098.3206099","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3206098.3206099","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd International Conference on Information System and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8600000143051147,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320315254","display_name":"Innovative Research Group Project of the National Natural Science Foundation of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W40976687","https://openalex.org/W244437071","https://openalex.org/W1500117362","https://openalex.org/W1533946607","https://openalex.org/W1608320902","https://openalex.org/W1956559956","https://openalex.org/W1969543361","https://openalex.org/W1985361918","https://openalex.org/W1995875735","https://openalex.org/W2007280555","https://openalex.org/W2029097226","https://openalex.org/W2049017883","https://openalex.org/W2058929792","https://openalex.org/W2071712180","https://openalex.org/W2081980673","https://openalex.org/W2110893883","https://openalex.org/W2129066856","https://openalex.org/W2150774511","https://openalex.org/W2153233077","https://openalex.org/W2167528246","https://openalex.org/W2180101149","https://openalex.org/W2321174411","https://openalex.org/W3123920865","https://openalex.org/W6685778296"],"related_works":["https://openalex.org/W2027903142","https://openalex.org/W2382132287","https://openalex.org/W3166133680","https://openalex.org/W2989366387","https://openalex.org/W2130519334","https://openalex.org/W4211010039","https://openalex.org/W2159877461","https://openalex.org/W2592341669","https://openalex.org/W2794873331","https://openalex.org/W2100055350"],"abstract_inverted_index":{"The":[0,118],"ordinal":[1,23,37,54],"relations":[2,24,38,55],"in":[3,42,70],"word":[4],"sequence":[5,8],"and":[6,19,28,106],"character":[7],"can":[9,56],"reflect":[10],"the":[11,22,36,43,53,61,65,88,107,113,122],"latent":[12],"information":[13,27],"about":[14],"writing":[15],"style,":[16],"genre":[17],"features":[18,103],"topic.":[20],"Thus,":[21],"are":[25,100],"important":[26],"should":[29],"be":[30,57],"considered":[31],"for":[32,84],"text":[33,47,85,124],"clustering.":[34,48],"However,":[35],"were":[39],"often":[40],"neglected":[41],"traditional":[44,130],"methods":[45],"of":[46,51,64,94,104],"In":[49,87],"view":[50],"that":[52],"statistically":[58],"characterized":[59],"by":[60,111],"transition":[62,92],"probabilities":[63,93],"higher":[66,78,96],"order":[67,79,97,108],"Markov":[68,80,98],"model,":[69],"this":[71],"paper,":[72],"a":[73,95],"new":[74,89,123],"method":[75,126],"based":[76],"on":[77],"model":[81,99],"was":[82],"proposed":[83],"representation.":[86],"method,":[90],"all":[91],"used":[101],"as":[102],"text,":[105],"is":[109],"identified":[110],"maximizing":[112],"average":[114],"Markov-Shannon":[115],"entropy":[116],"(MME).":[117],"experimental":[119],"results":[120],"imply":[121],"representation":[125],"performs":[127],"better":[128],"than":[129],"method.":[131]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
