{"id":"https://openalex.org/W2991598420","doi":"https://doi.org/10.26615/978-954-452-056-4_134","title":"Comparison of Machine Learning Approaches for Industry Classification Based on Textual Descriptions of Companies","display_name":"Comparison of Machine Learning Approaches for Industry Classification Based on Textual Descriptions of Companies","publication_year":2019,"publication_date":"2019-10-22","ids":{"openalex":"https://openalex.org/W2991598420","doi":"https://doi.org/10.26615/978-954-452-056-4_134","mag":"2991598420"},"language":"en","primary_location":{"id":"doi:10.26615/978-954-452-056-4_134","is_oa":true,"landing_page_url":"http://doi.org/10.26615/978-954-452-056-4_134","pdf_url":"https://doi.org/10.26615/978-954-452-056-4_134","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings - Natural Language Processing in a Deep Learning World","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.26615/978-954-452-056-4_134","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Sirma AI trading as Ontotext, Bulgara","orcid":null},"institutions":[{"id":"https://openalex.org/I24768866","display_name":"Bulgarian Academy of Sciences","ror":"https://ror.org/01x8hew03","country_code":"BG","type":"government","lineage":["https://openalex.org/I24768866"]},{"id":"https://openalex.org/I4210163063","display_name":"Institute of Information and Communication Technologies","ror":"https://ror.org/05fpsjc82","country_code":"BG","type":"facility","lineage":["https://openalex.org/I24768866","https://openalex.org/I4210163063"]}],"countries":["BG"],"is_corresponding":true,"raw_author_name":"Sirma AI trading as Ontotext, Bulgara","raw_affiliation_strings":["Institute of Information and Communication Technologies, Bulgarian Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Institute of Information and Communication Technologies, Bulgarian Academy of Sciences","institution_ids":["https://openalex.org/I4210163063","https://openalex.org/I24768866"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026648166","display_name":"Andrey Tagarev","orcid":"https://orcid.org/0000-0003-4262-7277"},"institutions":[{"id":"https://openalex.org/I24768866","display_name":"Bulgarian Academy of Sciences","ror":"https://ror.org/01x8hew03","country_code":"BG","type":"government","lineage":["https://openalex.org/I24768866"]},{"id":"https://openalex.org/I4210163063","display_name":"Institute of Information and Communication Technologies","ror":"https://ror.org/05fpsjc82","country_code":"BG","type":"facility","lineage":["https://openalex.org/I24768866","https://openalex.org/I4210163063"]}],"countries":["BG"],"is_corresponding":false,"raw_author_name":"Andrey Tagarev","raw_affiliation_strings":["Institute of Information and Communication Technologies, Bulgarian Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Institute of Information and Communication Technologies, Bulgarian Academy of Sciences","institution_ids":["https://openalex.org/I4210163063","https://openalex.org/I24768866"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083253268","display_name":"Nikola Tulechki","orcid":"https://orcid.org/0000-0002-7318-1637"},"institutions":[{"id":"https://openalex.org/I24768866","display_name":"Bulgarian Academy of Sciences","ror":"https://ror.org/01x8hew03","country_code":"BG","type":"government","lineage":["https://openalex.org/I24768866"]},{"id":"https://openalex.org/I4210163063","display_name":"Institute of Information and Communication Technologies","ror":"https://ror.org/05fpsjc82","country_code":"BG","type":"facility","lineage":["https://openalex.org/I24768866","https://openalex.org/I4210163063"]}],"countries":["BG"],"is_corresponding":false,"raw_author_name":"Nikola Tulechki","raw_affiliation_strings":["Institute of Information and Communication Technologies, Bulgarian Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Institute of Information and Communication Technologies, Bulgarian Academy of Sciences","institution_ids":["https://openalex.org/I4210163063","https://openalex.org/I24768866"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Sirma AI trading as Ontotext, Bulgara","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sirma AI trading as Ontotext, Bulgara","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044704545","display_name":"Svetla Boytcheva","orcid":"https://orcid.org/0000-0002-5542-9168"},"institutions":[{"id":"https://openalex.org/I24768866","display_name":"Bulgarian Academy of Sciences","ror":"https://ror.org/01x8hew03","country_code":"BG","type":"government","lineage":["https://openalex.org/I24768866"]},{"id":"https://openalex.org/I4210163063","display_name":"Institute of Information and Communication Technologies","ror":"https://ror.org/05fpsjc82","country_code":"BG","type":"facility","lineage":["https://openalex.org/I24768866","https://openalex.org/I4210163063"]}],"countries":["BG"],"is_corresponding":false,"raw_author_name":"Svetla Boytcheva","raw_affiliation_strings":["Institute of Information and Communication Technologies, Bulgarian Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Institute of Information and Communication Technologies, Bulgarian Academy of Sciences","institution_ids":["https://openalex.org/I4210163063","https://openalex.org/I24768866"]}]},{"author_position":"last","author":{"id":null,"display_name":"Sirma AI trading as Ontotext, Bulgara","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sirma AI trading as Ontotext, Bulgara","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I24768866","https://openalex.org/I4210163063"],"apc_list":null,"apc_paid":null,"fwci":0.578,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.76779187,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1169","last_page":"1175"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9894000291824341,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.987500011920929,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7585859298706055},{"id":"https://openalex.org/keywords/schema","display_name":"Schema (genetic algorithms)","score":0.6662523150444031},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6072304248809814},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5629405975341797},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.43748411536216736},{"id":"https://openalex.org/keywords/classification-scheme","display_name":"Classification scheme","score":0.42285650968551636},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3811595141887665},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3799641728401184},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1459033191204071}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7585859298706055},{"id":"https://openalex.org/C52146309","wikidata":"https://www.wikidata.org/wiki/Q7431116","display_name":"Schema (genetic algorithms)","level":2,"score":0.6662523150444031},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6072304248809814},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5629405975341797},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.43748411536216736},{"id":"https://openalex.org/C13460635","wikidata":"https://www.wikidata.org/wiki/Q85753676","display_name":"Classification scheme","level":2,"score":0.42285650968551636},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3811595141887665},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3799641728401184},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1459033191204071},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.26615/978-954-452-056-4_134","is_oa":true,"landing_page_url":"http://doi.org/10.26615/978-954-452-056-4_134","pdf_url":"https://doi.org/10.26615/978-954-452-056-4_134","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings - Natural Language Processing in a Deep Learning World","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.26615/978-954-452-056-4_134","is_oa":true,"landing_page_url":"http://doi.org/10.26615/978-954-452-056-4_134","pdf_url":"https://doi.org/10.26615/978-954-452-056-4_134","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings - Natural Language Processing in a Deep Learning World","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.5899999737739563,"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9"}],"awards":[{"id":"https://openalex.org/G453067482","display_name":null,"funder_award_id":"014-2020","funder_id":"https://openalex.org/F4320335322","funder_display_name":"European Regional Development Fund"},{"id":"https://openalex.org/G5634946813","display_name":null,"funder_award_id":"2014-2020","funder_id":"https://openalex.org/F4320335322","funder_display_name":"European Regional Development Fund"}],"funders":[{"id":"https://openalex.org/F4320335322","display_name":"European Regional Development Fund","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2991598420.pdf","grobid_xml":"https://content.openalex.org/works/W2991598420.grobid-xml"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W202303397","https://openalex.org/W1484485089","https://openalex.org/W1486649854","https://openalex.org/W1550206324","https://openalex.org/W1562615108","https://openalex.org/W1570978137","https://openalex.org/W1600295424","https://openalex.org/W1614298861","https://openalex.org/W1826790618","https://openalex.org/W1879009681","https://openalex.org/W1995258314","https://openalex.org/W1996514462","https://openalex.org/W2044933868","https://openalex.org/W2113461044","https://openalex.org/W2121082043","https://openalex.org/W2147880316","https://openalex.org/W2149684865","https://openalex.org/W2151595407","https://openalex.org/W2166183437","https://openalex.org/W2171444767","https://openalex.org/W2250539671","https://openalex.org/W2254361154","https://openalex.org/W2896457183","https://openalex.org/W2942203175","https://openalex.org/W2950577311","https://openalex.org/W2962739339","https://openalex.org/W2963026768","https://openalex.org/W2963341956","https://openalex.org/W2963908579","https://openalex.org/W2964110616","https://openalex.org/W2970597249","https://openalex.org/W3103900065","https://openalex.org/W3105625590","https://openalex.org/W4234200468","https://openalex.org/W4234849553"],"related_works":["https://openalex.org/W855278477","https://openalex.org/W2409268345","https://openalex.org/W2370299578","https://openalex.org/W1581172184","https://openalex.org/W2484602794","https://openalex.org/W2033101018","https://openalex.org/W2961085424","https://openalex.org/W2134732314","https://openalex.org/W2099278314","https://openalex.org/W2394886764"],"abstract_inverted_index":{"This":[0],"paper":[1],"addresses":[2],"the":[3,51],"task":[4],"of":[5,15,50],"categorizing":[6],"companies":[7,19],"within":[8],"industry":[9],"classification":[10,26,54],"schemes.":[11],"The":[12,24],"dataset":[13],"consists":[14],"encyclopedic":[16],"articles":[17],"about":[18],"and":[20,61],"their":[21],"economic":[22],"activities.":[23],"target":[25],"schema":[27],"is":[28],"build":[29],"by":[30],"mapping":[31],"linked":[32],"open":[33],"data":[34],"in":[35],"a":[36],"semi-supervised":[37],"manner.":[38],"Target":[39],"classes":[40],"are":[41],"built":[42],"bottom-up":[43],"from":[44],"DBpedia.":[45],"We":[46],"apply":[47],"several":[48],"state":[49],"art":[52],"text":[53],"techniques,":[55],"based":[56],"both":[57],"on":[58],"deep":[59],"learning":[60],"classical":[62],"vectorspace":[63],"models.":[64]},"counts_by_year":[{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2019-12-05T00:00:00"}
