{"id":"https://openalex.org/W4406461921","doi":"https://doi.org/10.1109/bigdata62323.2024.10825415","title":"Enriching Skill Taxonomies through Vector Space Models","display_name":"Enriching Skill Taxonomies through Vector Space Models","publication_year":2024,"publication_date":"2024-12-15","ids":{"openalex":"https://openalex.org/W4406461921","doi":"https://doi.org/10.1109/bigdata62323.2024.10825415"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata62323.2024.10825415","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825415","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102781905","display_name":"Simone D\u2019Amico","orcid":"https://orcid.org/0009-0002-2820-0277"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Simone D\u2019Amico","raw_affiliation_strings":["University of Milano-Bicocca,CRISP Research Centre,Italy"],"affiliations":[{"raw_affiliation_string":"University of Milano-Bicocca,CRISP Research Centre,Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056749454","display_name":"Alessia De Santo","orcid":null},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Alessia De Santo","raw_affiliation_strings":["University of Milano-Bicocca,CRISP Research Centre,Italy"],"affiliations":[{"raw_affiliation_string":"University of Milano-Bicocca,CRISP Research Centre,Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047827615","display_name":"Fabio Mercorio","orcid":"https://orcid.org/0000-0001-6864-2702"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Fabio Mercorio","raw_affiliation_strings":["University of Milano-Bicocca,CRISP Research Centre,Italy"],"affiliations":[{"raw_affiliation_string":"University of Milano-Bicocca,CRISP Research Centre,Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039716498","display_name":"Mario Mezzanzanica","orcid":"https://orcid.org/0000-0003-0399-2810"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Mario Mezzanzanica","raw_affiliation_strings":["University of Milano-Bicocca,CRISP Research Centre,Italy"],"affiliations":[{"raw_affiliation_string":"University of Milano-Bicocca,CRISP Research Centre,Italy","institution_ids":["https://openalex.org/I66752286"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5102781905"],"corresponding_institution_ids":["https://openalex.org/I66752286"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.27158176,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2297","last_page":"2302"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11122","display_name":"Online Learning and Analytics","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11122","display_name":"Online Learning and Analytics","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9883999824523926,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6660711765289307},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.5978594422340393},{"id":"https://openalex.org/keywords/vector-space","display_name":"Vector space","score":0.49962520599365234},{"id":"https://openalex.org/keywords/vector","display_name":"Vector (molecular biology)","score":0.48170286417007446},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41771888732910156},{"id":"https://openalex.org/keywords/vector-space-model","display_name":"Vector space model","score":0.41493749618530273},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3331044018268585},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3232484459877014},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14388501644134521}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6660711765289307},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.5978594422340393},{"id":"https://openalex.org/C13336665","wikidata":"https://www.wikidata.org/wiki/Q125977","display_name":"Vector space","level":2,"score":0.49962520599365234},{"id":"https://openalex.org/C92087593","wikidata":"https://www.wikidata.org/wiki/Q427389","display_name":"Vector (molecular biology)","level":4,"score":0.48170286417007446},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41771888732910156},{"id":"https://openalex.org/C89686163","wikidata":"https://www.wikidata.org/wiki/Q1187982","display_name":"Vector space model","level":2,"score":0.41493749618530273},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3331044018268585},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3232484459877014},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14388501644134521},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C40767141","wikidata":"https://www.wikidata.org/wiki/Q285697","display_name":"Recombinant DNA","level":3,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/bigdata62323.2024.10825415","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825415","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},{"id":"pmh:oai:boa.unimib.it:10281/534462","is_oa":false,"landing_page_url":"https://hdl.handle.net/10281/534462","pdf_url":null,"source":{"id":"https://openalex.org/S4306401259","display_name":"BOA (University of Milano-Bicocca)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I66752286","host_organization_name":"University of Milano-Bicocca","host_organization_lineage":["https://openalex.org/I66752286"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W2798965707","https://openalex.org/W2883153670","https://openalex.org/W2896457183","https://openalex.org/W2962992134","https://openalex.org/W2970597249","https://openalex.org/W3012615229","https://openalex.org/W3012823870","https://openalex.org/W3036762099","https://openalex.org/W3105298925","https://openalex.org/W3114918172","https://openalex.org/W3212837704","https://openalex.org/W4211076749","https://openalex.org/W4221153270","https://openalex.org/W4297035741","https://openalex.org/W4312833999","https://openalex.org/W4386576685","https://openalex.org/W4399511904","https://openalex.org/W4400488119","https://openalex.org/W6784923235","https://openalex.org/W6802012755","https://openalex.org/W6849760658","https://openalex.org/W6869227218","https://openalex.org/W6870135743"],"related_works":["https://openalex.org/W2096728994","https://openalex.org/W2349139068","https://openalex.org/W1974406477","https://openalex.org/W3161401723","https://openalex.org/W1540114765","https://openalex.org/W105748137","https://openalex.org/W2391634343","https://openalex.org/W1966027089","https://openalex.org/W2362958218","https://openalex.org/W1883708690"],"abstract_inverted_index":{"Hierarchical":[0],"taxonomies":[1,70],"serve":[2],"as":[3,15,79,176,186],"fundamental":[4],"structures":[5],"for":[6,87,122,200,220],"reasoning":[7],"with":[8,58,100,111,142,153,167],"hierarchical":[9,98],"concepts":[10,39],"across":[11],"various":[12],"domains":[13],"such":[14],"healthcare,":[16],"finance,":[17],"and":[18,24,29,36,116,202],"economy.":[19],"However,":[20],"maintaining":[21],"their":[22],"relevance":[23],"accuracy":[25],"is":[26],"a":[27,48,66,90,182,231,238],"labor-intensive":[28],"error-prone":[30],"task,":[31],"demanding":[32],"experts":[33,175],"to":[34,55,68,93,114,134],"identify":[35,115],"revise":[37],"novel":[38],"constantly.":[40],"In":[41,61],"this":[42],"context,":[43],"distributional":[44],"semantics":[45],"techniques":[46],"offer":[47],"promising":[49],"avenue":[50],"by":[51,71,173],"suggesting":[52],"terms":[53,74,102,121,145,162,170],"likely":[54],"be":[56],"associated":[57],"existing":[59],"concepts.":[60],"our":[62,228],"study,":[63],"we":[64,108],"propose":[65],"method":[67],"enhance":[69],"adding":[72],"related":[73],"using":[75,103,234],"contextual":[76],"word":[77],"embedding":[78],"encoders.":[80],"We":[81,223],"introduce":[82],"VESPATE":[83,110,127,213],"(VEctor":[84],"SPAce":[85],"model":[86],"Taxonomy":[88],"Enrichment),":[89],"system":[91,229],"designed":[92],"automatically":[94],"expand":[95],"any":[96],"given":[97],"taxonomy":[99,207],"new":[101,169],"three":[104,247],"generative":[105,195],"models.":[106,248],"Additionally,":[107,209],"integrate":[109],"human":[112,217],"validation":[113],"select":[117],"the":[118,125,136,148,191,194,198,210,216,221,225],"most":[119],"suitable":[120],"inclusion":[123],"in":[124,206],"taxonomy.":[126],"was":[128],"deployed":[129],"within":[130],"an":[131],"EU":[132],"project":[133],"enrich":[135],"official":[137],"European":[138],"Skill":[139],"taxonomy,":[140],"ESCO,":[141],"40K+":[143],"digital":[144],"gathered":[146],"from":[147],"Web,":[149],"aligning":[150],"ESCO":[151],"skills":[152],"current":[154],"labor":[155],"market":[156],"needs.":[157],"A":[158],"total":[159],"of":[160,184,193,212,227],"924":[161],"were":[163],"selected":[164],"through":[165],"VESPATE,":[166],"757":[168],"subsequently":[171],"validated":[172],"domain":[174],"correctly":[177],"matched.":[178],"Our":[179],"framework,":[180],"employing":[181],"pool":[183],"LLMs":[185],"encoders,":[187],"helped":[188],"us":[189],"mitigate":[190],"limitations":[192],"model,":[196],"reducing":[197],"potential":[199],"errors":[201],"ensuring":[203],"precise":[204],"results":[205],"enrichment.":[208],"implementation":[211],"consistently":[214],"decreased":[215],"effort":[218],"required":[219],"project.":[222],"evaluated":[224],"robustness":[226],"against":[230],"baseline":[232],"constructed":[233],"ESCO\u2019s":[235],"hierarchy,":[236],"achieving":[237],"81%":[239],"Positive":[240],"Predictive":[241],"Value":[242],"(PPV)":[243],"when":[244],"combining":[245],"all":[246]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
