{"id":"https://openalex.org/W4407900252","doi":"https://doi.org/10.1109/access.2025.3544814","title":"LLM Teacher-Student Framework for Text Classification With No Manually Annotated Data: A Case Study in IPTC News Topic Classification","display_name":"LLM Teacher-Student Framework for Text Classification With No Manually Annotated Data: A Case Study in IPTC News Topic Classification","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4407900252","doi":"https://doi.org/10.1109/access.2025.3544814"},"language":"en","primary_location":{"id":"doi:10.1109/access.2025.3544814","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3544814","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3544814","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032339009","display_name":"Taja Kuzman","orcid":"https://orcid.org/0000-0001-7436-9896"},"institutions":[{"id":"https://openalex.org/I3006985408","display_name":"Jo\u017eef Stefan Institute","ror":"https://ror.org/05060sz93","country_code":"SI","type":"facility","lineage":["https://openalex.org/I3006985408"]}],"countries":["SI"],"is_corresponding":true,"raw_author_name":"Taja Kuzman","raw_affiliation_strings":["Department of Knowledge Technologies, Jo&#x017E;ef Stefan Institute, Ljubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Department of Knowledge Technologies, Jo&#x017E;ef Stefan Institute, Ljubljana, Slovenia","institution_ids":["https://openalex.org/I3006985408"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021557805","display_name":"Nikola Ljube\u0161i\u0107","orcid":"https://orcid.org/0000-0001-7169-9152"},"institutions":[{"id":"https://openalex.org/I3006985408","display_name":"Jo\u017eef Stefan Institute","ror":"https://ror.org/05060sz93","country_code":"SI","type":"facility","lineage":["https://openalex.org/I3006985408"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Nikola Ljube\u0161i\u0107","raw_affiliation_strings":["Department of Knowledge Technologies, Jo&#x017E;ef Stefan Institute, Ljubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Department of Knowledge Technologies, Jo&#x017E;ef Stefan Institute, Ljubljana, Slovenia","institution_ids":["https://openalex.org/I3006985408"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5032339009"],"corresponding_institution_ids":["https://openalex.org/I3006985408"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":25.7393,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.99362298,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"13","issue":null,"first_page":"35621","last_page":"35633"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.8809999823570251,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.8809999823570251,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.8269000053405762,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7861260175704956},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5176311135292053},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.43501555919647217},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3775371015071869},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.37712591886520386},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3296475112438202}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7861260175704956},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5176311135292053},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43501555919647217},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3775371015071869},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.37712591886520386},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3296475112438202}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2025.3544814","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3544814","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:4aba1de2a952493cb29a61ddeb58e0d4","is_oa":true,"landing_page_url":"https://doaj.org/article/4aba1de2a952493cb29a61ddeb58e0d4","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 35621-35633 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3544814","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3544814","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.8299999833106995,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G1942605888","display_name":null,"funder_award_id":"L2-50070","funder_id":"https://openalex.org/F4320322554","funder_display_name":"Javna Agencija za Raziskovalno Dejavnost RS"},{"id":"https://openalex.org/G5835491414","display_name":null,"funder_award_id":"P6-0411","funder_id":"https://openalex.org/F4320322554","funder_display_name":"Javna Agencija za Raziskovalno Dejavnost RS"}],"funders":[{"id":"https://openalex.org/F4320322554","display_name":"Javna Agencija za Raziskovalno Dejavnost RS","ror":"https://ror.org/059bp8k51"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W2034059165","https://openalex.org/W2090240037","https://openalex.org/W2611476725","https://openalex.org/W2954365773","https://openalex.org/W2977937308","https://openalex.org/W3035390927","https://openalex.org/W3082619305","https://openalex.org/W3118179615","https://openalex.org/W3128553165","https://openalex.org/W3128655363","https://openalex.org/W3152272674","https://openalex.org/W3185236989","https://openalex.org/W4200444669","https://openalex.org/W4210764005","https://openalex.org/W4309488928","https://openalex.org/W4327811957","https://openalex.org/W4366826292","https://openalex.org/W4385571411","https://openalex.org/W4385572634","https://openalex.org/W4386566339","https://openalex.org/W4386625167","https://openalex.org/W4386714913","https://openalex.org/W4388735460","https://openalex.org/W4389524372","https://openalex.org/W4390075090","https://openalex.org/W4392828261","https://openalex.org/W4393163454","https://openalex.org/W4401042743","https://openalex.org/W4401042760","https://openalex.org/W4401043249","https://openalex.org/W4401043890","https://openalex.org/W4404783774","https://openalex.org/W6682691769","https://openalex.org/W6809361247","https://openalex.org/W6810081322","https://openalex.org/W6843398536","https://openalex.org/W6852898014","https://openalex.org/W6866949868","https://openalex.org/W6912503167"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W3188962172","https://openalex.org/W2772917594","https://openalex.org/W4312825515","https://openalex.org/W4306742369","https://openalex.org/W4303457083","https://openalex.org/W2131146434","https://openalex.org/W2951359407","https://openalex.org/W4376623224","https://openalex.org/W3204019825"],"abstract_inverted_index":{"With":[0],"the":[1,15,73,104,110,137,143,148,163,174,180,183,188,191,230,239,243],"ever-increasing":[2],"number":[3,217],"of":[4,14,53,86,150,153,182,190,218,242],"news":[5,49,79,88,232],"stories":[6],"available":[7],"online,":[8],"classifying":[9],"them":[10],"by":[11,109],"topic,":[12],"regardless":[13],"language":[16,43],"they":[17],"are":[18,97,160],"written":[19],"in,":[20],"has":[21],"become":[22],"crucial":[23],"for":[24,46,59],"enhancing":[25],"readers\u2019":[26],"access":[27],"to":[28,76,134,173],"relevant":[29],"content.":[30],"To":[31,141],"address":[32],"this":[33],"challenge,":[34],"we":[35,178,228],"propose":[36],"a":[37,66,78,214],"teacher-student":[38],"framework":[39,64],"based":[40],"on":[41,162,187],"large":[42],"models":[44,52,159,168,193,208],"(LLMs)":[45],"developing":[47],"multilingual":[48,236],"topic":[50,80,233],"classification":[51,237],"reasonable":[54],"size":[55,186],"with":[56,129,147,213,238],"no":[57],"need":[58],"manual":[60],"data":[61,185],"annotation.":[62],"The":[63,116,203],"employs":[65],"Generative":[67],"Pretrained":[68],"Transformer":[69],"(GPT)":[70],"model":[71,75,118],"as":[72],"teacher":[74,117,175],"develop":[77],"training":[81,184,219],"dataset":[82],"through":[83],"automatic":[84],"annotation":[85],"20,000":[87],"articles":[89],"in":[90,123],"Slovenian,":[91],"Croatian,":[92],"Greek,":[93],"and":[94,194,199,221],"Catalan.":[95],"Articles":[96],"classified":[98],"into":[99],"17":[100],"main":[101],"categories":[102,241],"from":[103],"Media":[105,245],"Topic":[106,246],"schema,":[107],"developed":[108],"International":[111],"Press":[112],"Telecommunications":[113],"Council":[114],"(IPTC).":[115],"exhibits":[119],"high":[120,170,211],"zero-shot":[121,200,224],"performance":[122,171,189,212],"all":[124],"four":[125],"languages.":[126],"Its":[127],"agreement":[128],"human":[130,138],"annotators":[131,139],"is":[132],"comparable":[133,172],"that":[135,206],"between":[136],"themselves.":[140],"mitigate":[142],"computational":[144],"limitations":[145],"associated":[146],"requirement":[149],"processing":[151],"millions":[152],"texts":[154],"daily,":[155],"smaller":[156],"BERT-like":[157],"student":[158,167,192,207],"fine-tuned":[161],"GPT-annotated":[164],"dataset.":[165],"These":[166],"achieve":[169,210],"model.":[176],"Furthermore,":[177],"explore":[179],"impact":[181],"investigate":[195],"their":[196],"monolingual,":[197],"multilingual,":[198],"cross-lingual":[201,225],"capabilities.":[202],"findings":[204],"indicate":[205],"can":[209],"relatively":[215],"small":[216],"instances,":[220],"demonstrate":[222],"strong":[223],"abilities.":[226],"Finally,":[227],"publish":[229],"best-performing":[231],"classifier,":[234],"enabling":[235],"top-level":[240],"IPTC":[244],"schema.":[247]},"counts_by_year":[{"year":2025,"cited_by_count":9}],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
