{"id":"https://openalex.org/W7134187065","doi":"https://doi.org/10.1109/bigdata66926.2025.11402454","title":"JobHop: A Large-Scale Dataset of Career Trajectories","display_name":"JobHop: A Large-Scale Dataset of Career Trajectories","publication_year":2025,"publication_date":"2025-12-08","ids":{"openalex":"https://openalex.org/W7134187065","doi":"https://doi.org/10.1109/bigdata66926.2025.11402454"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata66926.2025.11402454","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata66926.2025.11402454","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://hdl.handle.net/1854/LU-01KK9G9E4499JX8RRS67GW1JRH","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114618077","display_name":"Iman Johary","orcid":null},"institutions":[{"id":"https://openalex.org/I32597200","display_name":"Ghent University","ror":"https://ror.org/00cv9y106","country_code":"BE","type":"education","lineage":["https://openalex.org/I32597200"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Iman Johary","raw_affiliation_strings":["Ghent University,AIDA-IDLab,Department of Electronics and Information Systems"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ghent University,AIDA-IDLab,Department of Electronics and Information Systems","institution_ids":["https://openalex.org/I32597200"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046853585","display_name":"R. Romero","orcid":"https://orcid.org/0000-0002-3573-988X"},"institutions":[{"id":"https://openalex.org/I32597200","display_name":"Ghent University","ror":"https://ror.org/00cv9y106","country_code":"BE","type":"education","lineage":["https://openalex.org/I32597200"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Rapha\u00ebl Romero","raw_affiliation_strings":["Ghent University,AIDA-IDLab,Department of Electronics and Information Systems"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ghent University,AIDA-IDLab,Department of Electronics and Information Systems","institution_ids":["https://openalex.org/I32597200"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077156975","display_name":"Alexandru Mara","orcid":"https://orcid.org/0000-0001-8358-9997"},"institutions":[{"id":"https://openalex.org/I32597200","display_name":"Ghent University","ror":"https://ror.org/00cv9y106","country_code":"BE","type":"education","lineage":["https://openalex.org/I32597200"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Alexandru C. Mara","raw_affiliation_strings":["Ghent University,AIDA-IDLab,Department of Electronics and Information Systems"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ghent University,AIDA-IDLab,Department of Electronics and Information Systems","institution_ids":["https://openalex.org/I32597200"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5123910163","display_name":"Tijl De Bie","orcid":null},"institutions":[{"id":"https://openalex.org/I32597200","display_name":"Ghent University","ror":"https://ror.org/00cv9y106","country_code":"BE","type":"education","lineage":["https://openalex.org/I32597200"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Tijl De Bie","raw_affiliation_strings":["Ghent University,AIDA-IDLab,Department of Electronics and Information Systems"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ghent University,AIDA-IDLab,Department of Electronics and Information Systems","institution_ids":["https://openalex.org/I32597200"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.7731508,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2184","last_page":"2191"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.08060000091791153,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.08060000091791153,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10726","display_name":"Career Development and Diversity","score":0.06909999996423721,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.06560000032186508,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.28619998693466187},{"id":"https://openalex.org/keywords/data-collection","display_name":"Data collection","score":0.27570000290870667},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.26829999685287476},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.25600001215934753},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.2531999945640564}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4366999864578247},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3084000051021576},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.28619998693466187},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.27570000290870667},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.26829999685287476},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.25600001215934753},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.2531999945640564},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.2425999939441681},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.23999999463558197},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2273000031709671}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/bigdata66926.2025.11402454","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata66926.2025.11402454","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},{"id":"pmh:oai:archive.ugent.be:01KK9G9E4499JX8RRS67GW1JRH","is_oa":true,"landing_page_url":"http://hdl.handle.net/1854/LU-01KK9G9E4499JX8RRS67GW1JRH","pdf_url":null,"source":{"id":"https://openalex.org/S4306400478","display_name":"Ghent University Academic Bibliography (Ghent University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I32597200","host_organization_name":"Ghent University","host_organization_lineage":["https://openalex.org/I32597200"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ISBN: 9798331594473","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"pmh:oai:archive.ugent.be:01KK9G9E4499JX8RRS67GW1JRH","is_oa":true,"landing_page_url":"http://hdl.handle.net/1854/LU-01KK9G9E4499JX8RRS67GW1JRH","pdf_url":null,"source":{"id":"https://openalex.org/S4306400478","display_name":"Ghent University Academic Bibliography (Ghent University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I32597200","host_organization_name":"Ghent University","host_organization_lineage":["https://openalex.org/I32597200"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ISBN: 9798331594473","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.44405028223991394,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1608335717","https://openalex.org/W1919900543","https://openalex.org/W2613228905","https://openalex.org/W2756268972","https://openalex.org/W2797753066","https://openalex.org/W2897356390","https://openalex.org/W2900868419","https://openalex.org/W4221057462","https://openalex.org/W4285174074","https://openalex.org/W4291158197","https://openalex.org/W4378529999","https://openalex.org/W4388559609","https://openalex.org/W4391893125","https://openalex.org/W4393065950","https://openalex.org/W4395008902","https://openalex.org/W4406458149","https://openalex.org/W4408854165"],"related_works":[],"abstract_inverted_index":{"Understanding":[0],"labor":[1,119,166],"market":[2,120,167],"dynamics":[3],"is":[4,62],"essential":[5],"for":[6,164],"policymakers,":[7],"employers,":[8],"and":[9,89,97,124,139,158],"job":[10,122,154,159],"seekers.":[11],"However,":[12],"comprehensive":[13],"datasets":[14],"that":[15],"capture":[16],"real-world":[17,108],"career":[18,59,128,136,156],"trajectories":[19],"are":[20],"scarce.":[21],"In":[22],"this":[23],"paper,":[24],"we":[25,51,148],"introduce":[26],"JobHop,":[27],"a":[28,71,78],"large-scale":[29],"public":[30,40],"dataset":[31,80,112,151],"derived":[32],"from":[33,88],"anonymized":[34],"resumes":[35,96],"provided":[36],"by":[37],"VDAB,":[38],"the":[39,125],"employment":[41],"service":[42],"in":[43,77],"Flanders,":[44],"Belgium.":[45],"Utilizing":[46],"Large":[47],"Language":[48],"Models":[49],"(LLMs),":[50],"process":[52],"unstructured":[53],"resume":[54],"data":[55],"to":[56,65,99],"extract":[57],"structured":[58],"information,":[60],"which":[61],"then":[63],"normalized":[64],"standardized":[66,100],"ESCO":[67,101],"occupation":[68,102],"codes":[69],"using":[70],"multi-label":[72],"classification":[73],"model.":[74],"This":[75,111],"results":[76],"rich":[79],"of":[81,127],"over":[82],"1.67":[83],"million":[84],"work":[85],"experiences,":[86],"extracted":[87],"grouped":[90],"into":[91,107],"more":[92],"than":[93],"361,000":[94],"user":[95],"mapped":[98],"codes,":[103],"offering":[104],"valuable":[105],"insights":[106],"occupational":[109,131],"transitions.":[110,132],"enables":[113],"diverse":[114],"applications,":[115],"such":[116],"as":[117],"analyzing":[118],"mobility,":[121],"stability,":[123],"effects":[126],"breaks":[129],"on":[130],"It":[133],"also":[134],"supports":[135],"path":[137],"prediction":[138],"other":[140],"data-driven":[141],"decision-making":[142],"processes.":[143],"To":[144],"illustrate":[145],"its":[146,162],"potential,":[147],"explore":[149],"key":[150],"characteristics,":[152],"including":[153],"distributions,":[155],"breaks,":[157],"transitions,":[160],"demonstrating":[161],"value":[163],"advancing":[165],"research.":[168]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-09T00:00:00"}
