{"id":"https://openalex.org/W4411422051","doi":"https://doi.org/10.1007/s10032-025-00542-w","title":"SlimDoc: lightweight distillation of document transformer models","display_name":"SlimDoc: lightweight distillation of document transformer models","publication_year":2025,"publication_date":"2025-06-18","ids":{"openalex":"https://openalex.org/W4411422051","doi":"https://doi.org/10.1007/s10032-025-00542-w"},"language":"en","primary_location":{"id":"doi:10.1007/s10032-025-00542-w","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10032-025-00542-w","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10032-025-00542-w.pdf","source":{"id":"https://openalex.org/S90108747","display_name":"International Journal on Document Analysis and Recognition (IJDAR)","issn_l":"1433-2825","issn":["1433-2825","1433-2833"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal on Document Analysis and Recognition (IJDAR)","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10032-025-00542-w.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093946912","display_name":"Marcel Lamott","orcid":"https://orcid.org/0009-0009-4345-6888"},"institutions":[{"id":"https://openalex.org/I4829542","display_name":"RheinMain University of Applied Sciences","ror":"https://ror.org/0378gm372","country_code":"DE","type":"education","lineage":["https://openalex.org/I4829542"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Marcel Lamott","raw_affiliation_strings":["RheinMain University of Applied Sciences, Wiesbaden, Germany"],"affiliations":[{"raw_affiliation_string":"RheinMain University of Applied Sciences, Wiesbaden, Germany","institution_ids":["https://openalex.org/I4829542"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114387767","display_name":"Muhammad Armaghan Shakir","orcid":null},"institutions":[{"id":"https://openalex.org/I929597975","display_name":"National University of Sciences and Technology","ror":"https://ror.org/03w2j5y17","country_code":"PK","type":"education","lineage":["https://openalex.org/I929597975"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Muhammad Armaghan Shakir","raw_affiliation_strings":["National University of Sciences and Technology, Islamabad, Pakistan"],"affiliations":[{"raw_affiliation_string":"National University of Sciences and Technology, Islamabad, Pakistan","institution_ids":["https://openalex.org/I929597975"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080230086","display_name":"Adrian Ulges","orcid":null},"institutions":[{"id":"https://openalex.org/I4829542","display_name":"RheinMain University of Applied Sciences","ror":"https://ror.org/0378gm372","country_code":"DE","type":"education","lineage":["https://openalex.org/I4829542"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Adrian Ulges","raw_affiliation_strings":["RheinMain University of Applied Sciences, Wiesbaden, Germany"],"affiliations":[{"raw_affiliation_string":"RheinMain University of Applied Sciences, Wiesbaden, Germany","institution_ids":["https://openalex.org/I4829542"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093946913","display_name":"Yves-Noel Weweler","orcid":null},"institutions":[{"id":"https://openalex.org/I4210109972","display_name":"Insiders Technologies (Germany)","ror":"https://ror.org/0179g4w23","country_code":"DE","type":"company","lineage":["https://openalex.org/I4210109972"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Yves-Noel Weweler","raw_affiliation_strings":["Insiders Technologies GmbH, Kaiserslautern, Germany"],"affiliations":[{"raw_affiliation_string":"Insiders Technologies GmbH, Kaiserslautern, Germany","institution_ids":["https://openalex.org/I4210109972"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003304863","display_name":"Faisal Shafait","orcid":"https://orcid.org/0000-0002-0922-0566"},"institutions":[{"id":"https://openalex.org/I929597975","display_name":"National University of Sciences and Technology","ror":"https://ror.org/03w2j5y17","country_code":"PK","type":"education","lineage":["https://openalex.org/I929597975"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Faisal Shafait","raw_affiliation_strings":["National University of Sciences and Technology, Islamabad, Pakistan"],"affiliations":[{"raw_affiliation_string":"National University of Sciences and Technology, Islamabad, Pakistan","institution_ids":["https://openalex.org/I929597975"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5093946912"],"corresponding_institution_ids":["https://openalex.org/I4829542"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.07066718,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"28","issue":"3","first_page":"457","last_page":"473"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6850571632385254},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5659540891647339},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4834374189376831},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4823398292064667},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.47518932819366455},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4653276801109314},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.4092394709587097},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.32039546966552734},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.09650906920433044}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6850571632385254},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5659540891647339},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4834374189376831},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4823398292064667},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.47518932819366455},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4653276801109314},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.4092394709587097},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32039546966552734},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.09650906920433044},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s10032-025-00542-w","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10032-025-00542-w","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10032-025-00542-w.pdf","source":{"id":"https://openalex.org/S90108747","display_name":"International Journal on Document Analysis and Recognition (IJDAR)","issn_l":"1433-2825","issn":["1433-2825","1433-2833"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal on Document Analysis and Recognition (IJDAR)","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s10032-025-00542-w","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10032-025-00542-w","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10032-025-00542-w.pdf","source":{"id":"https://openalex.org/S90108747","display_name":"International Journal on Document Analysis and Recognition (IJDAR)","issn_l":"1433-2825","issn":["1433-2825","1433-2833"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal on Document Analysis and Recognition (IJDAR)","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4411422051.pdf","grobid_xml":"https://content.openalex.org/works/W4411422051.grobid-xml"},"referenced_works_count":48,"referenced_works":["https://openalex.org/W1965555277","https://openalex.org/W2896457183","https://openalex.org/W2949849869","https://openalex.org/W2963122961","https://openalex.org/W2963899988","https://openalex.org/W2965373594","https://openalex.org/W2970454332","https://openalex.org/W2978017171","https://openalex.org/W2981852735","https://openalex.org/W2986619406","https://openalex.org/W2997154779","https://openalex.org/W3003484198","https://openalex.org/W3023264106","https://openalex.org/W3034999214","https://openalex.org/W3049480682","https://openalex.org/W3101007570","https://openalex.org/W3104953317","https://openalex.org/W3105966348","https://openalex.org/W3120043490","https://openalex.org/W3176664887","https://openalex.org/W3176851559","https://openalex.org/W3200672527","https://openalex.org/W3216533828","https://openalex.org/W4213213306","https://openalex.org/W4226020328","https://openalex.org/W4229907684","https://openalex.org/W4287271794","https://openalex.org/W4304013646","https://openalex.org/W4304014014","https://openalex.org/W4320481960","https://openalex.org/W4322718191","https://openalex.org/W4379256266","https://openalex.org/W4391375196","https://openalex.org/W4392019445","https://openalex.org/W4402422437","https://openalex.org/W4402430708","https://openalex.org/W4402670523","https://openalex.org/W6637551013","https://openalex.org/W6638523607","https://openalex.org/W6680532216","https://openalex.org/W6739901393","https://openalex.org/W6778883912","https://openalex.org/W6796581206","https://openalex.org/W6847076894","https://openalex.org/W6852962002","https://openalex.org/W6853251322","https://openalex.org/W6856051742","https://openalex.org/W6906869370"],"related_works":["https://openalex.org/W4390516098","https://openalex.org/W2181948922","https://openalex.org/W2384362569","https://openalex.org/W2142795561","https://openalex.org/W4205302943","https://openalex.org/W2561132942","https://openalex.org/W3155418658","https://openalex.org/W4243199227","https://openalex.org/W2379948177","https://openalex.org/W2119949815"],"abstract_inverted_index":{"Abstract":[0],"Deploying":[1],"state-of-the-art":[2],"document":[3,37,47,65,96,119,215,225],"understanding":[4,38,97,120,226],"models":[5,39,68,129,227],"remains":[6],"resource-intensive":[7],"and":[8,20,46,90,108,189,217,229,233],"impractical":[9],"in":[10],"many":[11],"real-world":[12],"scenarios,":[13],"particularly":[14],"where":[15],"labeled":[16,53,165],"data":[17,235],"is":[18,86,236],"scarce":[19],"computational":[21],"budgets":[22],"are":[23],"constrained.":[24],"To":[25],"address":[26],"these":[27],"challenges,":[28],"this":[29],"work":[30],"proposes":[31],"a":[32,105,109,169,202],"novel":[33],"approach":[34,59,85,210],"towards":[35],"parameter-efficient":[36],"capable":[40],"of":[41,95,112,141,158,182,185,198,201],"adapting":[42],"to":[43,62,92,102,211,218],"specific":[44],"tasks":[45],"types":[48],"without":[49],"the":[50,93,113,142,146,159,183,199,222],"need":[51],"for":[52],"data.":[54],"Specifically,":[55],"we":[56,167],"propose":[57],"an":[58],"coined":[60],"SlimDoc":[61,101],"distill":[63],"multimodal":[64],"transformer":[66],"encoder":[67],"into":[69],"smaller":[70],"student":[71,128,171],"models,":[72],"using":[73],"internal":[74],"signals":[75],"at":[76,238],"different":[77],"training":[78,234],"stages,":[79],"followed":[80],"by":[81,88],"external":[82],"signals.":[83],"Our":[84,126,231],"inspired":[87],"TinyBERT":[89],"adapted":[91],"domain":[94],"transformers.":[98],"We":[99,206],"demonstrate":[100,122,207],"outperform":[103],"both":[104],"single-stage":[106],"distillation":[107,209],"direct":[110],"fine-tuning":[111],"student.":[114],"Experimental":[115],"results":[116],"across":[117],"six":[118],"datasets":[121],"our":[123,208],"approach\u2019s":[124],"effectiveness:":[125],"distilled":[127],"achieve":[130,149],"on":[131,214,221],"average":[132],"$$93.0\\%$$":[133],"<mml:math":[134,151,175,191],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\">":[135,152,176,192],"<mml:mrow>":[136,153,177,193],"<mml:mn>93.0</mml:mn>":[137],"<mml:mo>%</mml:mo>":[138,155,179,195],"</mml:mrow>":[139,156,180,196],"</mml:math>":[140,157,181,197],"teacher\u2019s":[143,160],"performance,":[144],"while":[145],"fine-tuned":[147],"students":[148],"$$87.0\\%$$":[150],"<mml:mn>87.0</mml:mn>":[154],"performance.":[161],"Without":[162],"requiring":[163],"any":[164],"data,":[166],"create":[168],"compact":[170],"which":[172],"achieves":[173],"$$96.0\\%$$":[174],"<mml:mn>96.0</mml:mn>":[178],"performance":[184,200],"its":[186],"supervised-distilled":[187],"counterpart":[188],"$$86.2\\%$$":[190],"<mml:mn>86.2</mml:mn>":[194],"supervised-fine-tuned":[203],"teacher":[204],"model.":[205],"pick":[212],"up":[213],"geometry":[216],"be":[219],"effective":[220],"two":[223],"popular":[224],"LiLT":[228],"LayoutLMv3.":[230],"implementation":[232],"available":[237],"https://github.com/marcel-lamott/SlimDoc":[239],".":[240]},"counts_by_year":[],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
