{"id":"https://openalex.org/W7087731579","doi":"https://doi.org/10.18420/inf2025_86","title":"Automated classification of German job titles according to KldB: Challenges and novel methods","display_name":"Automated classification of German job titles according to KldB: Challenges and novel methods","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W7087731579","doi":"https://doi.org/10.18420/inf2025_86"},"language":"en","primary_location":{"id":"doi:10.18420/inf2025_86","is_oa":true,"landing_page_url":"https://doi.org/10.18420/inf2025_86","pdf_url":null,"source":{"id":"https://openalex.org/S7407052918","display_name":"Gesellschaft f\u00fcr Informatik (GI)","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article-journal"},"type":"article","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.18420/inf2025_86","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Dorau, Ralf","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Dorau, Ralf","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Hein, Kristine","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hein, Kristine","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"D\u00f6rpinghaus, Jens","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"D\u00f6rpinghaus, Jens","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Tiemann, Michael","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tiemann, Michael","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.64395955,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T13776","display_name":"Phytochemical and Pharmacological Studies","score":0.06679999828338623,"subfield":{"id":"https://openalex.org/subfields/2707","display_name":"Complementary and alternative medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T13776","display_name":"Phytochemical and Pharmacological Studies","score":0.06679999828338623,"subfield":{"id":"https://openalex.org/subfields/2707","display_name":"Complementary and alternative medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T13526","display_name":"14-3-3 protein interactions","score":0.04439999908208847,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T13937","display_name":"Genetics, Bioinformatics, and Biomedical Research","score":0.024900000542402267,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/german","display_name":"German","score":0.7968999743461609},{"id":"https://openalex.org/keywords/vocational-education","display_name":"Vocational education","score":0.5012999773025513},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.4562999904155731},{"id":"https://openalex.org/keywords/synonym","display_name":"Synonym (taxonomy)","score":0.4323999881744385},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.3555000126361847},{"id":"https://openalex.org/keywords/job-analysis","display_name":"Job analysis","score":0.30869999527931213}],"concepts":[{"id":"https://openalex.org/C154775046","wikidata":"https://www.wikidata.org/wiki/Q188","display_name":"German","level":2,"score":0.7968999743461609},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6015999913215637},{"id":"https://openalex.org/C668760","wikidata":"https://www.wikidata.org/wiki/Q6869278","display_name":"Vocational education","level":2,"score":0.5012999773025513},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.4562999904155731},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4453999996185303},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43700000643730164},{"id":"https://openalex.org/C173483453","wikidata":"https://www.wikidata.org/wiki/Q1040689","display_name":"Synonym (taxonomy)","level":3,"score":0.4323999881744385},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.3555000126361847},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3431999981403351},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.31790000200271606},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.313400000333786},{"id":"https://openalex.org/C58346731","wikidata":"https://www.wikidata.org/wiki/Q627339","display_name":"Job analysis","level":3,"score":0.30869999527931213},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.3082999885082245},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2946999967098236},{"id":"https://openalex.org/C174954385","wikidata":"https://www.wikidata.org/wiki/Q6206740","display_name":"Job performance","level":3,"score":0.2856999933719635},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.27790001034736633},{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.2761000096797943},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.2648000121116638},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.2533000111579895}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18420/inf2025_86","is_oa":true,"landing_page_url":"https://doi.org/10.18420/inf2025_86","pdf_url":null,"source":{"id":"https://openalex.org/S7407052918","display_name":"Gesellschaft f\u00fcr Informatik (GI)","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"doi:10.18420/inf2025_86","is_oa":true,"landing_page_url":"https://doi.org/10.18420/inf2025_86","pdf_url":null,"source":{"id":"https://openalex.org/S7407052918","display_name":"Gesellschaft f\u00fcr Informatik (GI)","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article-journal"},"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.7261844277381897,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0,20,115,145],"automated":[1],"classification":[2,25,106,180],"of":[3,10,26,35,64,112,117,139,150,160,179],"job":[4,28,78,154],"titles":[5,29,86,155],"constitutes":[6],"a":[7,39,62,73,176],"critical":[8],"component":[9],"labor":[11,196],"market":[12],"research,":[13],"survey":[14,71],"analysis,":[15],"and":[16,45,81,84,98,156,164,175],"administrative":[17],"data":[18,66],"processing.":[19],"present":[21,119],"study":[22,55,120],"explores":[23],"the":[24,32,43,105,113,118,137,148,158,184,194],"German":[27,33,195],"according":[30],"to":[31,51,103],"Classification":[34],"Occupations":[36],"(KldB),":[37],"with":[38],"particular":[40],"emphasis":[41],"on":[42,153,189],"linguistic":[44],"structural":[46],"challenges":[47],"that":[48,122],"are":[49,101],"inherent":[50],"this":[52],"task.":[53],"This":[54,168],"builds":[56],"upon":[57],"previous":[58],"research":[59,188],"by":[60],"incorporating":[61],"variety":[63],"heterogeneous":[65],"sources,":[67],"including":[68,93],"manually":[69],"annotated":[70],"responses,":[72],"comprehensive":[74],"synonym":[75],"dataset,":[76],"online":[77],"advertisements":[79],"(OJAs),":[80],"vocational":[82],"education":[83],"training":[85],"from":[87],"DAZUBI.":[88],"Conventional":[89],"machine":[90],"learning":[91],"models,":[92],"logistic":[94],"regression,":[95],"naive":[96],"Bayes,":[97],"random":[99],"forest,":[100],"employed":[102],"assess":[104],"performance":[107,140],"at":[108,136],"varying":[109],"taxonomic":[110],"levels":[111],"KldB.":[114],"findings":[116,146],"demonstrate":[121],"while":[123],"substantial":[124],"results":[125],"can":[126],"be":[127],"achieved":[128],"for":[129,186],"broad":[130],"occupational":[131,191],"categories,":[132],"fine-grained":[133],"classification,":[134],"particularly":[135],"level":[138],"(5th":[141],"digit),":[142],"remains":[143],"challenging.":[144],"underscore":[147,157],"limitations":[149],"relying":[151],"solely":[152],"importance":[159],"richer":[161],"contextual":[162],"information":[163],"more":[165],"expressive":[166],"models.":[167],"work":[169],"provides":[170],"both":[171],"an":[172],"expanded":[173],"dataset":[174],"systematic":[177],"analysis":[178],"performance,":[181],"thereby":[182],"establishing":[183],"foundation":[185],"future":[187],"context-aware":[190],"coding":[192],"in":[193],"market.":[197]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-11T00:00:00"}
