{"id":"https://openalex.org/W2920184902","doi":"https://doi.org/10.1145/3297156.3297248","title":"A Hybrid Approach for Measuring Similarity between Government Documents of China","display_name":"A Hybrid Approach for Measuring Similarity between Government Documents of China","publication_year":2018,"publication_date":"2018-12-08","ids":{"openalex":"https://openalex.org/W2920184902","doi":"https://doi.org/10.1145/3297156.3297248","mag":"2920184902"},"language":"en","primary_location":{"id":"doi:10.1145/3297156.3297248","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3297156.3297248","pdf_url":null,"source":{"id":"https://openalex.org/S4306523626","display_name":"Proceedings of the 2018 2nd International Conference on Computer Science and Artificial Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 2nd International Conference on Computer Science and Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084587716","display_name":"Zeyuan Li","orcid":"https://orcid.org/0009-0006-2088-8707"},"institutions":[{"id":"https://openalex.org/I4210096250","display_name":"Beijing Institute of Big Data Research","ror":"https://ror.org/00s1sz824","country_code":"CN","type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I37796252","https://openalex.org/I4210096250"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zeyuan Li","raw_affiliation_strings":["CETC Big Data Research Institute Co., Ltd., Guiyang, China"],"affiliations":[{"raw_affiliation_string":"CETC Big Data Research Institute Co., Ltd., Guiyang, China","institution_ids":["https://openalex.org/I4210096250"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049875848","display_name":"Jie He","orcid":null},"institutions":[{"id":"https://openalex.org/I4210096250","display_name":"Beijing Institute of Big Data Research","ror":"https://ror.org/00s1sz824","country_code":"CN","type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I37796252","https://openalex.org/I4210096250"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie He","raw_affiliation_strings":["CETC Big Data Research Institute Co., Ltd., Guiyang, China"],"affiliations":[{"raw_affiliation_string":"CETC Big Data Research Institute Co., Ltd., Guiyang, China","institution_ids":["https://openalex.org/I4210096250"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009434777","display_name":"Dagang Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210096250","display_name":"Beijing Institute of Big Data Research","ror":"https://ror.org/00s1sz824","country_code":"CN","type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I37796252","https://openalex.org/I4210096250"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dagang Chen","raw_affiliation_strings":["CETC Big Data Research Institute Co., Ltd., Guiyang, China"],"affiliations":[{"raw_affiliation_string":"CETC Big Data Research Institute Co., Ltd., Guiyang, China","institution_ids":["https://openalex.org/I4210096250"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046642410","display_name":"Xin Fang","orcid":"https://orcid.org/0000-0002-7274-8195"},"institutions":[{"id":"https://openalex.org/I4210096250","display_name":"Beijing Institute of Big Data Research","ror":"https://ror.org/00s1sz824","country_code":"CN","type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I37796252","https://openalex.org/I4210096250"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Fang","raw_affiliation_strings":["CETC Big Data Research Institute Co., Ltd., Guiyang, China"],"affiliations":[{"raw_affiliation_string":"CETC Big Data Research Institute Co., Ltd., Guiyang, China","institution_ids":["https://openalex.org/I4210096250"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075261068","display_name":"Yajun Song","orcid":"https://orcid.org/0000-0002-1543-4691"},"institutions":[{"id":"https://openalex.org/I4210096250","display_name":"Beijing Institute of Big Data Research","ror":"https://ror.org/00s1sz824","country_code":"CN","type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I37796252","https://openalex.org/I4210096250"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yajun Song","raw_affiliation_strings":["CETC Big Data Research Institute Co., Ltd., Guiyang, China"],"affiliations":[{"raw_affiliation_string":"CETC Big Data Research Institute Co., Ltd., Guiyang, China","institution_ids":["https://openalex.org/I4210096250"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044786927","display_name":"Zesong Li","orcid":"https://orcid.org/0000-0003-0975-4434"},"institutions":[{"id":"https://openalex.org/I4210096250","display_name":"Beijing Institute of Big Data Research","ror":"https://ror.org/00s1sz824","country_code":"CN","type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I37796252","https://openalex.org/I4210096250"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zesong Li","raw_affiliation_strings":["CETC Big Data Research Institute Co., Ltd., Guiyang, China"],"affiliations":[{"raw_affiliation_string":"CETC Big Data Research Institute Co., Ltd., Guiyang, China","institution_ids":["https://openalex.org/I4210096250"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5084587716"],"corresponding_institution_ids":["https://openalex.org/I4210096250"],"apc_list":null,"apc_paid":null,"fwci":0.3081,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.68189103,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"431","last_page":"435"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/government","display_name":"Government (linguistics)","score":0.7179300785064697},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.7037463188171387},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6907135248184204},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6436972618103027},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.6281692981719971},{"id":"https://openalex.org/keywords/publication","display_name":"Publication","score":0.5099121332168579},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.49556124210357666},{"id":"https://openalex.org/keywords/china","display_name":"China","score":0.4374709725379944},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.41021788120269775},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.36848294734954834},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.2221439778804779},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.18912893533706665},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.11778068542480469},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10972389578819275},{"id":"https://openalex.org/keywords/advertising","display_name":"Advertising","score":0.10438963770866394},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.09045952558517456}],"concepts":[{"id":"https://openalex.org/C2778137410","wikidata":"https://www.wikidata.org/wiki/Q2732820","display_name":"Government (linguistics)","level":2,"score":0.7179300785064697},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.7037463188171387},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6907135248184204},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6436972618103027},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.6281692981719971},{"id":"https://openalex.org/C41458344","wikidata":"https://www.wikidata.org/wiki/Q732577","display_name":"Publication","level":2,"score":0.5099121332168579},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.49556124210357666},{"id":"https://openalex.org/C191935318","wikidata":"https://www.wikidata.org/wiki/Q148","display_name":"China","level":2,"score":0.4374709725379944},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.41021788120269775},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.36848294734954834},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.2221439778804779},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.18912893533706665},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.11778068542480469},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10972389578819275},{"id":"https://openalex.org/C112698675","wikidata":"https://www.wikidata.org/wiki/Q37038","display_name":"Advertising","level":1,"score":0.10438963770866394},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.09045952558517456},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3297156.3297248","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3297156.3297248","pdf_url":null,"source":{"id":"https://openalex.org/S4306523626","display_name":"Proceedings of the 2018 2nd International Conference on Computer Science and Artificial Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 2nd International Conference on Computer Science and Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.75,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W36021107","https://openalex.org/W100623710","https://openalex.org/W1880262756","https://openalex.org/W1980867644","https://openalex.org/W2117130368","https://openalex.org/W2127997067","https://openalex.org/W2130199334","https://openalex.org/W2131744502","https://openalex.org/W2136480620","https://openalex.org/W2158997610","https://openalex.org/W2262787892","https://openalex.org/W2294429012","https://openalex.org/W2534712034","https://openalex.org/W2748006193","https://openalex.org/W2772323297","https://openalex.org/W4213338820"],"related_works":["https://openalex.org/W3024364549","https://openalex.org/W4206019083","https://openalex.org/W2048865712","https://openalex.org/W1976265003","https://openalex.org/W2370378377","https://openalex.org/W4237510188","https://openalex.org/W2130160813","https://openalex.org/W2054476758","https://openalex.org/W2327130486","https://openalex.org/W1984597391"],"abstract_inverted_index":{"In":[0,131],"China,":[1,113],"the":[2,38,41,44,52,57,72,81,141,154,157,159,162,165,173,176,178,185,189,192,198,203],"government":[3,9,23,35,54,75,110,145,151,179],"publishes":[4],"hundreds":[5],"of":[6,8,74,97,147,156,188],"thousands":[7],"documents":[10,24,55,84,111,146,152,180],"every":[11],"year.":[12],"The":[13],"civil":[14],"servants":[15],"in":[16,62,71,112],"China":[17,63],"are":[18,68,115],"struggling":[19],"to":[20,40,50,87],"find":[21,51],"relevant":[22],"while":[25],"doing":[26],"their":[27],"office":[28],"works,":[29],"such":[30,64,89],"as":[31,65,90,125,153],"writing":[32],"documents,":[33],"analyzing":[34],"policy,":[36],"explaining":[37],"policy":[39],"public.":[42],"Furthermore,":[43],"public":[45],"also":[46],"finds":[47],"it":[48],"difficult":[49],"exact":[53],"since":[56],"most":[58,95],"popular":[59],"search":[60,91],"engines":[61],"Baidu,":[66],"Sogou":[67],"not":[69],"specialized":[70],"field":[73],"document":[76,160,163],"searching":[77],"and":[78,92,105,168,208],"indexing.":[79],"Determining":[80],"similarity":[82,102,143,174,181,190],"between":[83,103,144,175,191],"is":[85,182],"critical":[86],"applications":[88],"recommendation.":[93],"Currently,":[94],"kinds":[96],"literatures":[98],"focus":[99],"on":[100],"semantic":[101],"words":[104],"paragraph":[106],"fragments.":[107],"As":[108],"for":[109,139],"they":[114,121],"written":[116],"under":[117],"standards":[118],"so":[119],"that":[120,197],"can":[122],"be":[123],"considered":[124],"semi-structured":[126],"data":[127,129],"after":[128],"cleansing.":[130],"this":[132],"paper,":[133],"we":[134],"propose":[135],"a":[136],"hybrid":[137,200],"approach":[138],"measuring":[140],"document-level":[142],"China.":[148],"We":[149],"represent":[150],"publisher":[155],"document,":[158],"domain,":[161],"type,":[164],"publishing":[166],"time":[167],"other":[169],"contents.":[170],"By":[171],"calculating":[172],"elements,":[177],"formed":[183],"by":[184],"weighted":[186],"sum":[187],"elements.":[193],"Experiment":[194],"results":[195],"show":[196],"proposed":[199],"method":[201],"outperforms":[202],"classic":[204],"methods":[205],"like":[206],"LDA":[207],"doc2vec.":[209]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
