{"id":"https://openalex.org/W1986216695","doi":"https://doi.org/10.1177/0165551512442481","title":"A new method to compose long unknown Chinese keywords","display_name":"A new method to compose long unknown Chinese keywords","publication_year":2012,"publication_date":"2012-06-06","ids":{"openalex":"https://openalex.org/W1986216695","doi":"https://doi.org/10.1177/0165551512442481","mag":"1986216695"},"language":"en","primary_location":{"id":"doi:10.1177/0165551512442481","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0165551512442481","pdf_url":null,"source":{"id":"https://openalex.org/S68913162","display_name":"Journal of Information Science","issn_l":"0165-5515","issn":["0165-5515","1741-6485"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035518545","display_name":"Yu\u2010Chin Liu","orcid":"https://orcid.org/0000-0002-2082-9647"},"institutions":[{"id":"https://openalex.org/I68348662","display_name":"Shih Hsin University","ror":"https://ror.org/03ynprv96","country_code":"TW","type":"education","lineage":["https://openalex.org/I68348662"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Yu-Chin Liu","raw_affiliation_strings":["Shih Hsin University, Taiwan, R.O.C","Shih-Hsin University , Taiwan , R.O.C"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shih Hsin University, Taiwan, R.O.C","institution_ids":["https://openalex.org/I68348662"]},{"raw_affiliation_string":"Shih-Hsin University , Taiwan , R.O.C","institution_ids":["https://openalex.org/I68348662"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042902868","display_name":"Chun\u2010Wei Lin","orcid":"https://orcid.org/0000-0003-0918-4961"},"institutions":[{"id":"https://openalex.org/I4210122179","display_name":"Wistron (Taiwan)","ror":"https://ror.org/02knfsk89","country_code":"TW","type":"company","lineage":["https://openalex.org/I4210122179"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chun-Wei Lin","raw_affiliation_strings":["Wistron Corporation, Taiwan, R.O.C"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Wistron Corporation, Taiwan, R.O.C","institution_ids":["https://openalex.org/I4210122179"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5035518545"],"corresponding_institution_ids":["https://openalex.org/I68348662"],"apc_list":null,"apc_paid":null,"fwci":0.4421,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.71298735,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"38","issue":"4","first_page":"366","last_page":"382"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8604104518890381},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.7485156655311584},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5987329483032227},{"id":"https://openalex.org/keywords/stop-words","display_name":"Stop words","score":0.5752459764480591},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5364428758621216},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5240186452865601},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.515975296497345},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5043517351150513},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.4525248408317566},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.43535593152046204},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.42901021242141724},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.4247104525566101},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.14122885465621948},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09140735864639282}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8604104518890381},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.7485156655311584},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5987329483032227},{"id":"https://openalex.org/C188338183","wikidata":"https://www.wikidata.org/wiki/Q80735","display_name":"Stop words","level":3,"score":0.5752459764480591},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5364428758621216},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5240186452865601},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.515975296497345},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5043517351150513},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.4525248408317566},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.43535593152046204},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.42901021242141724},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.4247104525566101},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.14122885465621948},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09140735864639282},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1177/0165551512442481","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0165551512442481","pdf_url":null,"source":{"id":"https://openalex.org/S68913162","display_name":"Journal of Information Science","issn_l":"0165-5515","issn":["0165-5515","1741-6485"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information Science","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.7099999785423279,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W41384227","https://openalex.org/W109070363","https://openalex.org/W113111301","https://openalex.org/W130742730","https://openalex.org/W210954981","https://openalex.org/W1537636424","https://openalex.org/W1558333962","https://openalex.org/W1593045043","https://openalex.org/W1940278502","https://openalex.org/W1956559956","https://openalex.org/W2007709031","https://openalex.org/W2014020335","https://openalex.org/W2020498346","https://openalex.org/W2024032340","https://openalex.org/W2037164444","https://openalex.org/W2045628429","https://openalex.org/W2045879682","https://openalex.org/W2051885765","https://openalex.org/W2058982198","https://openalex.org/W2060234482","https://openalex.org/W2093424574","https://openalex.org/W2100259670","https://openalex.org/W2101449764","https://openalex.org/W2104884878","https://openalex.org/W2112378479","https://openalex.org/W2129287413","https://openalex.org/W2140156730","https://openalex.org/W2156632403","https://openalex.org/W2160735413","https://openalex.org/W2165612380","https://openalex.org/W2325227998","https://openalex.org/W2420187884","https://openalex.org/W2435251607","https://openalex.org/W2745750801","https://openalex.org/W2913736068","https://openalex.org/W2996160789","https://openalex.org/W4241850027","https://openalex.org/W4241982274","https://openalex.org/W4241992701","https://openalex.org/W4242870862","https://openalex.org/W4254025347"],"related_works":["https://openalex.org/W2965546495","https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W4287688258","https://openalex.org/W3049211950","https://openalex.org/W4206165639","https://openalex.org/W2050712820","https://openalex.org/W2359738357"],"abstract_inverted_index":{"There":[0],"is":[1,23,53,80,175,211],"now":[2],"a":[3,27,117,133,172,214],"huge":[4],"amount":[5],"of":[6,29,41,49,139,233,246],"electronic":[7],"documents":[8,34,126],"stored":[9],"on":[10,38,166],"the":[11,39,47,105,137,147,155,167,179,218,237],"internet.":[12],"In":[13,44],"order":[14],"to":[15,73,98,102,115,177,227],"retrieve":[16],"information":[17,45],"from":[18,124,150],"this":[19],"data,":[20],"each":[21],"document":[22,160],"commonly":[24,81],"represented":[25],"as":[26,202],"set":[28,40],"keywords,":[30,171],"and":[31,153,170,221,241,251],"then":[32],"all":[33],"are":[35,62,94,187,200,225],"analysed":[36],"based":[37,165],"discriminative":[42],"words.":[43,76,111,184],"retrieval":[46],"recognition":[48],"words":[50,61,149,169,199,206,220,224],"in":[51,83],"articles":[52],"an":[54,190],"essential":[55],"step;":[56],"however,":[57],"unlike":[58],"English,":[59],"Chinese":[60,75,125],"not":[63,95],"distinguished":[64],"by":[65,127,189],"spaces.":[66],"Therefore,":[67],"many":[68],"approaches":[69],"have":[70],"been":[71],"devised":[72],"parse":[74,104],"The":[77,185,231],"dictionary-based":[78],"approach":[79],"used":[82,176],"most":[84],"current":[85],"systems":[86],"for":[87,120,181],"text":[88],"segmentation.":[89],"However,":[90],"general":[91],"purpose":[92],"dictionaries":[93],"always":[96],"able":[97],"provide":[99],"proper":[100],"references":[101],"accurately":[103],"domain-specific":[106,141],"words,":[107],"especially":[108],"with":[109,239],"unknown":[110,130,183,191,205],"This":[112],"paper":[113],"aims":[114],"propose":[116],"new":[118],"method":[119,144,255],"classifying":[121],"longer":[122],"keywords":[123,131,156],"incorporating":[128],"previously":[129],"into":[132],"keyword":[134],"list":[135],"without":[136],"effort":[138],"building":[140],"dictionaries.":[142],"Our":[143],"first":[145],"utilizes":[146],"parsed":[148,168,219],"existing":[151],"parsers":[152],"filters":[154],"utilizing":[157],"term":[158],"frequency\u2013inverse":[159],"frequency":[161],"(TF-IDF)":[162],"values;":[163],"further,":[164],"T":[173],"tree":[174],"store":[178],"candidates":[180,186],"composing":[182],"evaluated":[188],"word":[192],"(UW)":[193],"coefficient":[194,210],"threshold,":[195],"i.e.":[196],"newly":[197,203,222],"composed":[198,223],"deemed":[201],"discovered":[204],"if":[207],"their":[208],"UW":[209],"higher":[212],"than":[213],"pre-defined":[215],"threshold.":[216],"Finally,":[217],"re-filtered":[226],"form":[228],"long":[229],"keywords.":[230],"results":[232,238],"several":[234],"experiments":[235],"comparing":[236],"Google":[240],"Yahoo":[242],"show":[243],"that,":[244],"regardless":[245],"recall":[247],"rates,":[248],"precision":[249],"rates":[250],"F-measures,":[252],"our":[253],"proposed":[254],"significantly":[256],"outperforms":[257],"other":[258],"methods.":[259]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2015,"cited_by_count":1}],"updated_date":"2026-05-05T06:06:40.768181","created_date":"2025-10-10T00:00:00"}
