{"id":"https://openalex.org/W2743391579","doi":"https://doi.org/10.1145/3106426.3109035","title":"A language modelling approach for discovering novel labour market occupations from the web","display_name":"A language modelling approach for discovering novel labour market occupations from the web","publication_year":2017,"publication_date":"2017-08-10","ids":{"openalex":"https://openalex.org/W2743391579","doi":"https://doi.org/10.1145/3106426.3109035","mag":"2743391579"},"language":"en","primary_location":{"id":"doi:10.1145/3106426.3109035","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3106426.3109035","pdf_url":null,"source":{"id":"https://openalex.org/S4306524158","display_name":"Proceedings of the International Conference on Web Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference on Web Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078112922","display_name":"Stefania Marrara","orcid":"https://orcid.org/0000-0003-2745-3539"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Stefania Marrara","raw_affiliation_strings":["DISCo - University of Milano-Bicocca, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"DISCo - University of Milano-Bicocca, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066756066","display_name":"Gabriella Pasi","orcid":"https://orcid.org/0000-0002-6080-8170"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Gabriella Pasi","raw_affiliation_strings":["DISCo - University of Milano-Bicocca, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"DISCo - University of Milano-Bicocca, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074645479","display_name":"Marco Viviani","orcid":"https://orcid.org/0000-0002-2274-9050"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marco Viviani","raw_affiliation_strings":["DISCo - University of Milano-Bicocca, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"DISCo - University of Milano-Bicocca, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049259722","display_name":"Mirko Cesarini","orcid":"https://orcid.org/0000-0001-9601-0403"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Mirko Cesarini","raw_affiliation_strings":["DiSMeQ - University of Milano-Bicocca, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"DiSMeQ - University of Milano-Bicocca, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047827615","display_name":"Fabio Mercorio","orcid":"https://orcid.org/0000-0001-6864-2702"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Fabio Mercorio","raw_affiliation_strings":["DiSMeQ - University of Milano-Bicocca, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"DiSMeQ - University of Milano-Bicocca, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039716498","display_name":"Mario Mezzanzanica","orcid":"https://orcid.org/0000-0003-0399-2810"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Mario Mezzanzanica","raw_affiliation_strings":["DiSMeQ - University of Milano-Bicocca, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"DiSMeQ - University of Milano-Bicocca, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016785133","display_name":"M. Pappagallo","orcid":"https://orcid.org/0000-0001-7601-5602"},"institutions":[{"id":"https://openalex.org/I66752286","display_name":"University of Milano-Bicocca","ror":"https://ror.org/01ynf4891","country_code":"IT","type":"education","lineage":["https://openalex.org/I66752286"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marco Pappagallo","raw_affiliation_strings":["DISCo - University of Milano-Bicocca, Milan, Italy"],"affiliations":[{"raw_affiliation_string":"DISCo - University of Milano-Bicocca, Milan, Italy","institution_ids":["https://openalex.org/I66752286"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5078112922"],"corresponding_institution_ids":["https://openalex.org/I66752286"],"apc_list":null,"apc_paid":null,"fwci":0.7269,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.78680065,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1026","last_page":"1034"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9866999983787537,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/taxonomy","display_name":"Taxonomy (biology)","score":0.7156559228897095},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6146899461746216},{"id":"https://openalex.org/keywords/agency","display_name":"Agency (philosophy)","score":0.585658073425293},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5581007599830627},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.5115700364112854},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.49211734533309937},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34214532375335693},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.34197407960891724},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.33576464653015137},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3321087956428528},{"id":"https://openalex.org/keywords/knowledge-management","display_name":"Knowledge management","score":0.32528066635131836},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.21643579006195068},{"id":"https://openalex.org/keywords/sociology","display_name":"Sociology","score":0.21438032388687134},{"id":"https://openalex.org/keywords/social-science","display_name":"Social science","score":0.11291065812110901}],"concepts":[{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.7156559228897095},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6146899461746216},{"id":"https://openalex.org/C108170787","wikidata":"https://www.wikidata.org/wiki/Q3951828","display_name":"Agency (philosophy)","level":2,"score":0.585658073425293},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5581007599830627},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.5115700364112854},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.49211734533309937},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34214532375335693},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.34197407960891724},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.33576464653015137},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3321087956428528},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.32528066635131836},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.21643579006195068},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.21438032388687134},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.11291065812110901},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3106426.3109035","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3106426.3109035","pdf_url":null,"source":{"id":"https://openalex.org/S4306524158","display_name":"Proceedings of the International Conference on Web Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the International Conference on Web Intelligence","raw_type":"proceedings-article"},{"id":"pmh:oai:boa.unimib.it:10281/168475","is_oa":false,"landing_page_url":"http://hdl.handle.net/10281/168475","pdf_url":null,"source":{"id":"https://openalex.org/S4306401259","display_name":"BOA (University of Milano-Bicocca)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I66752286","host_organization_name":"University of Milano-Bicocca","host_organization_lineage":["https://openalex.org/I66752286"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.7599999904632568,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W628792916","https://openalex.org/W1611041715","https://openalex.org/W1631260214","https://openalex.org/W1904228841","https://openalex.org/W1963617357","https://openalex.org/W1985096808","https://openalex.org/W2003800060","https://openalex.org/W2016871293","https://openalex.org/W2068905009","https://openalex.org/W2070791591","https://openalex.org/W2092271315","https://openalex.org/W2093390569","https://openalex.org/W2097927681","https://openalex.org/W2136542423","https://openalex.org/W2136583886","https://openalex.org/W2142069714","https://openalex.org/W2152263452","https://openalex.org/W2167619573","https://openalex.org/W2240123196","https://openalex.org/W2251343465","https://openalex.org/W2619083728","https://openalex.org/W2950186769","https://openalex.org/W4206765718","https://openalex.org/W4240913316","https://openalex.org/W4243333943","https://openalex.org/W6636811518"],"related_works":["https://openalex.org/W3167258865","https://openalex.org/W4210357677","https://openalex.org/W2094117429","https://openalex.org/W1564472341","https://openalex.org/W2213259971","https://openalex.org/W2898732673","https://openalex.org/W2323552265","https://openalex.org/W4389797989","https://openalex.org/W2410053581","https://openalex.org/W2516596904"],"abstract_inverted_index":{"This":[0,23],"article":[1],"presents":[2],"an":[3],"approach":[4],"for":[5,41],"the":[6,18,28,32,37,42,53],"identification":[7],"of":[8,31,39],"potential":[9],"new":[10],"occupations,":[11],"i.e.,":[12],"professions,":[13],"not":[14],"yet":[15],"codified":[16],"by":[17,36,56],"international":[19],"standard":[20],"taxonomy":[21,55],"ISCO.":[22],"work":[24],"is":[25],"framed":[26],"within":[27],"research":[29],"activities":[30],"WoLMIS":[33],"project,":[34],"developed":[35],"University":[38],"Milano-Bicocca":[40],"CEDEFOP":[43],"European":[44],"Agency,":[45],"which":[46],"classifies":[47],"on-line":[48],"job":[49],"offers":[50],"according":[51],"to":[52],"ISCO":[54],"using":[57],"machine":[58],"learning":[59],"techniques.":[60]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
