{"id":"https://openalex.org/W2604673238","doi":"https://doi.org/10.1109/lsp.2017.2690599","title":"New Word Extraction From Chinese Financial Documents","display_name":"New Word Extraction From Chinese Financial Documents","publication_year":2017,"publication_date":"2017-04-03","ids":{"openalex":"https://openalex.org/W2604673238","doi":"https://doi.org/10.1109/lsp.2017.2690599","mag":"2604673238"},"language":"en","primary_location":{"id":"doi:10.1109/lsp.2017.2690599","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2017.2690599","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113743714","display_name":"Liwei Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Liwei Yan","raw_affiliation_strings":["Tsinghua National Laboratory for Information Science and Technology, Department of Electronic Engineering, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua National Laboratory for Information Science and Technology, Department of Electronic Engineering, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001405009","display_name":"Bo Bai","orcid":"https://orcid.org/0000-0003-4796-8249"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Bai","raw_affiliation_strings":["Future Network Theory Lab, Huawei Technologies Co. Ltd., Shatin, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Future Network Theory Lab, Huawei Technologies Co. Ltd., Shatin, Hong Kong","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108049716","display_name":"Wei Chen","orcid":"https://orcid.org/0000-0002-9066-1448"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Chen","raw_affiliation_strings":["Tsinghua National Laboratory for Information Science and Technology, Department of Electronic Engineering, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua National Laboratory for Information Science and Technology, Department of Electronic Engineering, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001469325","display_name":"Dapeng Wu","orcid":"https://orcid.org/0000-0003-1755-0183"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dapeng Oliver Wu","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Florida, Gainesville, FL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Florida, Gainesville, FL, USA","institution_ids":["https://openalex.org/I33213144"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5113743714"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.5851,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.74482665,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":"24","issue":"6","first_page":"770","last_page":"773"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.9704999923706055,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12205","display_name":"Time Series Analysis and Forecasting","score":0.9276999831199646,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8294477462768555},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.665662944316864},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6207267045974731},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6181532740592957},{"id":"https://openalex.org/keywords/novelty","display_name":"Novelty","score":0.6040985584259033},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5736187100410461},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5579304695129395},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.53760826587677},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4761752486228943},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.4733928442001343},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.4724709689617157},{"id":"https://openalex.org/keywords/contrast","display_name":"Contrast (vision)","score":0.4482821524143219},{"id":"https://openalex.org/keywords/keyword-extraction","display_name":"Keyword extraction","score":0.41664573550224304},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.39893779158592224},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.08035153150558472}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8294477462768555},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.665662944316864},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6207267045974731},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6181532740592957},{"id":"https://openalex.org/C2778738651","wikidata":"https://www.wikidata.org/wiki/Q16546687","display_name":"Novelty","level":2,"score":0.6040985584259033},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5736187100410461},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5579304695129395},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.53760826587677},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4761752486228943},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.4733928442001343},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.4724709689617157},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.4482821524143219},{"id":"https://openalex.org/C2780288562","wikidata":"https://www.wikidata.org/wiki/Q25053353","display_name":"Keyword extraction","level":2,"score":0.41664573550224304},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.39893779158592224},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.08035153150558472},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0},{"id":"https://openalex.org/C27206212","wikidata":"https://www.wikidata.org/wiki/Q34178","display_name":"Theology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lsp.2017.2690599","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2017.2690599","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5299999713897705,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[{"id":"https://openalex.org/G8896799008","display_name":null,"funder_award_id":"61401249","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1493309334","https://openalex.org/W1560601000","https://openalex.org/W1568297139","https://openalex.org/W2041412237","https://openalex.org/W2096301385","https://openalex.org/W2138151602","https://openalex.org/W2142937697","https://openalex.org/W2147102537","https://openalex.org/W2153635508","https://openalex.org/W2154756108","https://openalex.org/W2159591557","https://openalex.org/W3010180081","https://openalex.org/W6633469971","https://openalex.org/W6681770459"],"related_works":["https://openalex.org/W2351671768","https://openalex.org/W2004087619","https://openalex.org/W2469016277","https://openalex.org/W2557094866","https://openalex.org/W2757101400","https://openalex.org/W2362196274","https://openalex.org/W1982302668","https://openalex.org/W1990527953","https://openalex.org/W2240384024","https://openalex.org/W4283768689"],"abstract_inverted_index":{"With":[0],"the":[1,31,55,59,65],"tremendous":[2],"development":[3],"of":[4,19,67,99,103],"data":[5],"science,":[6],"using":[7],"unstructured":[8],"documents":[9],"to":[10,29,51],"analyze":[11],"marketing":[12],"dynamics":[13],"is":[14,35,58],"attracting":[15],"a":[16,37,80,97],"great":[17],"deal":[18],"attention.":[20],"In":[21,49],"this":[22],"letter,":[23],"we":[24],"propose":[25],"an":[26],"iterative":[27],"scheme":[28],"extract":[30],"new":[32],"words,":[33],"which":[34,105],"often":[36],"bottleneck":[38],"for":[39],"Chinese":[40],"natural":[41],"language":[42],"processing":[43],"(NLP)":[44],"in":[45],"financial":[46],"markets":[47],"analysis.":[48],"contrast":[50],"existing":[52],"static":[53],"features,":[54],"key":[56],"novelty":[57],"proposed":[60],"dynamic":[61],"features":[62],"that":[63],"characterize":[64],"similarity":[66],"context":[68,74],"patterns.":[69],"Via":[70],"iteration,":[71],"distinguishable":[72],"seed":[73],"patterns":[75],"are":[76],"extracted.":[77],"Tested":[78],"on":[79],"203":[81],"MB":[82],"corpus,":[83],"19":[84],"291":[85],"words":[86],"representing":[87],"emerging":[88],"industries,":[89],"entities,":[90],"projects,":[91],"and":[92,101],"products":[93],"were":[94],"extracted":[95],"with":[96],"precision":[98],"89.8%":[100],"recall":[102],"88.9%,":[104],"outperforms":[106],"most":[107],"competitor":[108],"methods.":[109]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
