{"id":"https://openalex.org/W3007002238","doi":"https://doi.org/10.1109/bigdata47090.2019.9006438","title":"Peer Firm Identification Using Word Embeddings","display_name":"Peer Firm Identification Using Word Embeddings","publication_year":2019,"publication_date":"2019-12-01","ids":{"openalex":"https://openalex.org/W3007002238","doi":"https://doi.org/10.1109/bigdata47090.2019.9006438","mag":"3007002238"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata47090.2019.9006438","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata47090.2019.9006438","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082754828","display_name":"Taeyoung Kee","orcid":"https://orcid.org/0000-0003-4632-1312"},"institutions":[{"id":"https://openalex.org/I9927081","display_name":"Aalto University","ror":"https://ror.org/020hwjq30","country_code":"FI","type":"education","lineage":["https://openalex.org/I9927081"]}],"countries":["FI"],"is_corresponding":true,"raw_author_name":"Taeyoung Kee","raw_affiliation_strings":["Management Science, Aalto University School of Business, Helsinki, Finland"],"affiliations":[{"raw_affiliation_string":"Management Science, Aalto University School of Business, Helsinki, Finland","institution_ids":["https://openalex.org/I9927081"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5082754828"],"corresponding_institution_ids":["https://openalex.org/I9927081"],"apc_list":null,"apc_paid":null,"fwci":0.1443,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.61627301,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"2019","issue":null,"first_page":"5536","last_page":"5543"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9835000038146973,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9750000238418579,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/word-embedding","display_name":"Word embedding","score":0.684474766254425},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6705794334411621},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.6642832159996033},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.585096538066864},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5810904502868652},{"id":"https://openalex.org/keywords/cosine-similarity","display_name":"Cosine similarity","score":0.5741714239120483},{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.504254937171936},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5031399130821228},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4669440984725952},{"id":"https://openalex.org/keywords/homogeneous","display_name":"Homogeneous","score":0.46406206488609314},{"id":"https://openalex.org/keywords/vector-space-model","display_name":"Vector space model","score":0.44555097818374634},{"id":"https://openalex.org/keywords/similarity-measure","display_name":"Similarity measure","score":0.4349876642227173},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.42017388343811035},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.38304072618484497},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.1540859341621399},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14158329367637634}],"concepts":[{"id":"https://openalex.org/C2777462759","wikidata":"https://www.wikidata.org/wiki/Q18395344","display_name":"Word embedding","level":3,"score":0.684474766254425},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6705794334411621},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.6642832159996033},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.585096538066864},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5810904502868652},{"id":"https://openalex.org/C2780762811","wikidata":"https://www.wikidata.org/wiki/Q1784941","display_name":"Cosine similarity","level":3,"score":0.5741714239120483},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.504254937171936},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5031399130821228},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4669440984725952},{"id":"https://openalex.org/C66882249","wikidata":"https://www.wikidata.org/wiki/Q169336","display_name":"Homogeneous","level":2,"score":0.46406206488609314},{"id":"https://openalex.org/C89686163","wikidata":"https://www.wikidata.org/wiki/Q1187982","display_name":"Vector space model","level":2,"score":0.44555097818374634},{"id":"https://openalex.org/C2776517306","wikidata":"https://www.wikidata.org/wiki/Q29017317","display_name":"Similarity measure","level":2,"score":0.4349876642227173},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42017388343811035},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38304072618484497},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.1540859341621399},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14158329367637634},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/bigdata47090.2019.9006438","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata47090.2019.9006438","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},{"id":"mag:3042097161","is_oa":false,"landing_page_url":"https://jglobal.jst.go.jp/en/detail?JGLOBAL_ID=202002258156915623","pdf_url":null,"source":{"id":"https://openalex.org/S4306512817","display_name":"IEEE Conference Proceedings","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":"IEEE Conference Proceedings","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.6100000143051147,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W8870360","https://openalex.org/W27071641","https://openalex.org/W1509222058","https://openalex.org/W1614298861","https://openalex.org/W1616194121","https://openalex.org/W1976912826","https://openalex.org/W2101095786","https://openalex.org/W2250539671","https://openalex.org/W2274159779","https://openalex.org/W2493916176","https://openalex.org/W2896457183","https://openalex.org/W2901530179","https://openalex.org/W2950577311","https://openalex.org/W2962739339","https://openalex.org/W2963341956","https://openalex.org/W3122311160","https://openalex.org/W3123123374","https://openalex.org/W3124462827","https://openalex.org/W3125104891","https://openalex.org/W3125370119","https://openalex.org/W6600367688","https://openalex.org/W6601085690","https://openalex.org/W6723250868","https://openalex.org/W6755207826"],"related_works":["https://openalex.org/W3011505626","https://openalex.org/W57923944","https://openalex.org/W3128481113","https://openalex.org/W2284045667","https://openalex.org/W960953481","https://openalex.org/W3109760095","https://openalex.org/W2056226831","https://openalex.org/W1598081081","https://openalex.org/W1823511492","https://openalex.org/W2981287881"],"abstract_inverted_index":{"In":[0,20,78],"the":[1,21,36,51,57,74,95,133,149,171],"task":[2],"of":[3,16,35,38,53,98,107,166],"peer":[4,85,117,134,167],"firm":[5,86,138],"identification,":[6],"researchers":[7],"have":[8],"relied":[9],"on":[10,90,103],"existing":[11,22,172],"industry":[12,23,76],"classification":[13,24,173],"system":[14],"regardless":[15,34],"their":[17,120],"critical":[18],"limitations.":[19],"system,":[25],"a":[26,83,104,113],"company":[27],"should":[28],"be":[29],"categorized":[30],"into":[31],"one":[32],"group":[33],"number":[37],"products":[39],"and":[40],"services":[41],"it":[42,45,66],"offers.":[43],"Furthermore,":[44],"is":[46],"not":[47,155],"possible":[48],"to":[49,56,70,128,170],"measure":[50],"similarity":[52,97,122],"companies":[54],"belonging":[55],"same":[58,150],"group.":[59],"The":[60],"systems":[61],"are":[62],"revised":[63],"manually,":[64],"rendering":[65],"difficult":[67],"for":[68],"them":[69],"keep":[71],"up":[72],"with":[73,119],"fast-changing":[75],"landscape.":[77],"this":[79],"paper,":[80],"we":[81,111],"propose":[82],"novel":[84],"identification":[87],"method":[88,114,160],"based":[89],"Word":[91,158],"2Vec.":[92],"By":[93],"computing":[94],"cosine":[96],"word":[99],"embedding":[100],"vectors":[101],"trained":[102],"10-year":[105],"corpus":[106],"financial":[108],"news":[109,143],"articles,":[110],"developed":[112],"that":[115,140],"produces":[116],"firms":[118,135,168],"numeric":[121],"scores.":[123],"Our":[124],"approach":[125],"allows":[126],"us":[127],"observe":[129],"chronological":[130],"changes":[131],"in":[132,142,148],"by":[136],"having":[137],"words":[139],"appear":[141],"articles":[144],"from":[145],"different":[146],"periods":[147],"vector":[151],"space.":[152],"Last":[153],"but":[154],"least,":[156],"our":[157],"2Vec-based":[159],"produced":[161],"more":[162],"economically":[163],"homogeneous":[164],"groups":[165],"compared":[169],"systems.":[174]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3},{"year":2021,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
