{"id":"https://openalex.org/W4327737695","doi":"https://doi.org/10.3390/info14030187","title":"A Systematic Review of Transformer-Based Pre-Trained Language Models through Self-Supervised Learning","display_name":"A Systematic Review of Transformer-Based Pre-Trained Language Models through Self-Supervised Learning","publication_year":2023,"publication_date":"2023-03-16","ids":{"openalex":"https://openalex.org/W4327737695","doi":"https://doi.org/10.3390/info14030187"},"language":"en","primary_location":{"id":"doi:10.3390/info14030187","is_oa":true,"landing_page_url":"https://doi.org/10.3390/info14030187","pdf_url":"https://www.mdpi.com/2078-2489/14/3/187/pdf?version=1678963679","source":{"id":"https://openalex.org/S4210219776","display_name":"Information","issn_l":"2078-2489","issn":["2078-2489"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Information","raw_type":"journal-article"},"type":"review","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2078-2489/14/3/187/pdf?version=1678963679","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077957039","display_name":"Evans Kotei","orcid":"https://orcid.org/0000-0003-0181-5247"},"institutions":[{"id":"https://openalex.org/I876193797","display_name":"Vellore Institute of Technology University","ror":"https://ror.org/00qzypv28","country_code":"IN","type":"education","lineage":["https://openalex.org/I876193797"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Evans Kotei","raw_affiliation_strings":["School of Information Technology and Engineering, Vellore Institute of Technology, Vellore 632014, India"],"raw_orcid":"https://orcid.org/0000-0003-0181-5247","affiliations":[{"raw_affiliation_string":"School of Information Technology and Engineering, Vellore Institute of Technology, Vellore 632014, India","institution_ids":["https://openalex.org/I876193797"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034745758","display_name":"Ramkumar Thirunavukarasu","orcid":"https://orcid.org/0000-0003-2798-8007"},"institutions":[{"id":"https://openalex.org/I876193797","display_name":"Vellore Institute of Technology University","ror":"https://ror.org/00qzypv28","country_code":"IN","type":"education","lineage":["https://openalex.org/I876193797"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Ramkumar Thirunavukarasu","raw_affiliation_strings":["School of Information Technology and Engineering, Vellore Institute of Technology, Vellore 632014, India"],"raw_orcid":"https://orcid.org/0000-0003-2798-8007","affiliations":[{"raw_affiliation_string":"School of Information Technology and Engineering, Vellore Institute of Technology, Vellore 632014, India","institution_ids":["https://openalex.org/I876193797"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5034745758"],"corresponding_institution_ids":["https://openalex.org/I876193797"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":12.5912,"has_fulltext":true,"cited_by_count":76,"citation_normalized_percentile":{"value":0.99077024,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"14","issue":"3","first_page":"187","last_page":"187"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9872000217437744,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8329981565475464},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6787575483322144},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6771350502967834},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.6609372496604919},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.607001781463623},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.5714921951293945},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5698449015617371},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5521376729011536},{"id":"https://openalex.org/keywords/domain-adaptation","display_name":"Domain adaptation","score":0.5294138193130493},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.470439612865448},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.41584813594818115},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.21313634514808655},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.12289455533027649},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07924306392669678}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8329981565475464},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6787575483322144},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6771350502967834},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.6609372496604919},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.607001781463623},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.5714921951293945},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5698449015617371},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5521376729011536},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.5294138193130493},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.470439612865448},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41584813594818115},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.21313634514808655},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.12289455533027649},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07924306392669678},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/info14030187","is_oa":true,"landing_page_url":"https://doi.org/10.3390/info14030187","pdf_url":"https://www.mdpi.com/2078-2489/14/3/187/pdf?version=1678963679","source":{"id":"https://openalex.org/S4210219776","display_name":"Information","issn_l":"2078-2489","issn":["2078-2489"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Information","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:1f56bc11529648ea87049bcc497958eb","is_oa":true,"landing_page_url":"https://doaj.org/article/1f56bc11529648ea87049bcc497958eb","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Information, Vol 14, Iss 3, p 187 (2023)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2078-2489/14/3/187/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/info14030187","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Information; Volume 14; Issue 3; Pages: 187","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/info14030187","is_oa":true,"landing_page_url":"https://doi.org/10.3390/info14030187","pdf_url":"https://www.mdpi.com/2078-2489/14/3/187/pdf?version=1678963679","source":{"id":"https://openalex.org/S4210219776","display_name":"Information","issn_l":"2078-2489","issn":["2078-2489"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Information","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.5699999928474426}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4327737695.pdf"},"referenced_works_count":114,"referenced_works":["https://openalex.org/W1566289585","https://openalex.org/W1614298861","https://openalex.org/W1686810756","https://openalex.org/W1840435438","https://openalex.org/W1999554638","https://openalex.org/W2014079492","https://openalex.org/W2022479123","https://openalex.org/W2120615054","https://openalex.org/W2130942839","https://openalex.org/W2133564696","https://openalex.org/W2138857742","https://openalex.org/W2157331557","https://openalex.org/W2165698076","https://openalex.org/W2267186426","https://openalex.org/W2396881363","https://openalex.org/W2407776548","https://openalex.org/W2594990650","https://openalex.org/W2618530766","https://openalex.org/W2806758205","https://openalex.org/W2891631795","https://openalex.org/W2896457183","https://openalex.org/W2911489562","https://openalex.org/W2914526845","https://openalex.org/W2923014074","https://openalex.org/W2948902769","https://openalex.org/W2962784628","https://openalex.org/W2963026768","https://openalex.org/W2963250244","https://openalex.org/W2963716420","https://openalex.org/W2963846996","https://openalex.org/W2970368801","https://openalex.org/W2970597249","https://openalex.org/W2971196067","https://openalex.org/W2971207485","https://openalex.org/W2971258845","https://openalex.org/W2982021527","https://openalex.org/W2982213159","https://openalex.org/W2989539713","https://openalex.org/W2989676862","https://openalex.org/W2996035354","https://openalex.org/W2996264288","https://openalex.org/W2996822578","https://openalex.org/W2998957378","https://openalex.org/W2999219213","https://openalex.org/W3001434439","https://openalex.org/W3007007518","https://openalex.org/W3011411500","https://openalex.org/W3013601031","https://openalex.org/W3016187590","https://openalex.org/W3017637887","https://openalex.org/W3017961061","https://openalex.org/W3034255912","https://openalex.org/W3034999214","https://openalex.org/W3035390927","https://openalex.org/W3035396860","https://openalex.org/W3036601975","https://openalex.org/W3037063616","https://openalex.org/W3047171714","https://openalex.org/W3089168780","https://openalex.org/W3092448486","https://openalex.org/W3092462694","https://openalex.org/W3094834348","https://openalex.org/W3098085362","https://openalex.org/W3098469895","https://openalex.org/W3099950029","https://openalex.org/W3100110884","https://openalex.org/W3103368673","https://openalex.org/W3112689365","https://openalex.org/W3115462295","https://openalex.org/W3118043957","https://openalex.org/W3128090102","https://openalex.org/W3133650345","https://openalex.org/W3135427360","https://openalex.org/W3153266325","https://openalex.org/W3156665996","https://openalex.org/W3157876196","https://openalex.org/W3160137267","https://openalex.org/W3164045210","https://openalex.org/W3164896303","https://openalex.org/W3169113923","https://openalex.org/W3169483174","https://openalex.org/W3171975879","https://openalex.org/W3173151551","https://openalex.org/W3175870271","https://openalex.org/W3175898847","https://openalex.org/W3176617251","https://openalex.org/W3185909895","https://openalex.org/W3193158708","https://openalex.org/W3211490618","https://openalex.org/W4206706211","https://openalex.org/W4288089799","https://openalex.org/W4290875442","https://openalex.org/W4297730150","https://openalex.org/W4309548228","https://openalex.org/W4311430112","https://openalex.org/W4312846227","https://openalex.org/W4313550290","https://openalex.org/W4385245566","https://openalex.org/W6679436768","https://openalex.org/W6680300913","https://openalex.org/W6735377749","https://openalex.org/W6739901393","https://openalex.org/W6745682157","https://openalex.org/W6763701032","https://openalex.org/W6769627184","https://openalex.org/W6772299980","https://openalex.org/W6775774072","https://openalex.org/W6780218876","https://openalex.org/W6781275321","https://openalex.org/W6784416658","https://openalex.org/W6788210547","https://openalex.org/W6797132756","https://openalex.org/W6797399245","https://openalex.org/W7051469422"],"related_works":["https://openalex.org/W3099765033","https://openalex.org/W4220996320","https://openalex.org/W4312200629","https://openalex.org/W4382286161","https://openalex.org/W3035162004","https://openalex.org/W2960456850","https://openalex.org/W2946016983","https://openalex.org/W4317565044","https://openalex.org/W4361732492","https://openalex.org/W3186919929"],"abstract_inverted_index":{"Transfer":[0],"learning":[1,8,101,175],"is":[2,21],"a":[3,15,28,161,168],"technique":[4],"utilized":[5],"in":[6,33,179,196],"deep":[7,108],"applications":[9],"to":[10,14,23,121,142,151,185,193],"transmit":[11],"learned":[12],"inference":[13],"different":[16],"target":[17],"domain.":[18],"The":[19,40,96],"approach":[20],"mainly":[22],"solve":[24],"the":[25,66,77,107,115],"problem":[26],"of":[27,171],"few":[29],"training":[30,160],"datasets":[31,132],"resulting":[32],"model":[34,38,162],"overfitting,":[35],"which":[36,64],"affects":[37],"performance.":[39],"study":[41,97],"was":[42],"carried":[43],"out":[44],"on":[45,84,99,106,128],"publications":[46,91],"retrieved":[47,72],"from":[48,73,163],"various":[49],"digital":[50],"libraries":[51],"such":[52,147],"as":[53,148],"SCOPUS,":[54],"ScienceDirect,":[55],"IEEE":[56],"Xplore,":[57],"ACM":[58],"Digital":[59],"Library,":[60],"and":[61,79,87,112,124,176,182],"Google":[62],"Scholar,":[63],"formed":[65],"Primary":[67,74],"studies.":[68],"Secondary":[69],"studies":[70],"were":[71,92,114],"articles":[75],"using":[76],"backward":[78],"forward":[80],"snowballing":[81],"approach.":[82],"Based":[83],"set":[85],"inclusion":[86],"exclusion":[88],"parameters,":[89],"relevant":[90],"selected":[93],"for":[94],"review.":[95],"focused":[98],"transfer":[100,150],"pretrained":[102,118,197],"NLP":[103],"models":[104,119,138],"based":[105,127],"transformer":[109,137,172],"network.":[110],"BERT":[111],"GPT":[113],"two":[116],"elite":[117],"trained":[120],"classify":[122],"global":[123],"local":[125],"representations":[126],"larger":[129],"unlabeled":[130],"text":[131],"through":[133],"self-supervised":[134,174],"learning.":[135],"Pretrained":[136],"offer":[139],"numerous":[140],"advantages":[141],"natural":[143],"language":[144,180,199],"processing":[145],"models,":[146,181],"knowledge":[149],"downstream":[152,186],"tasks":[153],"that":[154],"deal":[155],"with":[156,159],"drawbacks":[157],"associated":[158],"scratch.":[164],"This":[165],"review":[166],"gives":[167],"comprehensive":[169],"view":[170],"architecture,":[173],"pretraining":[177],"concepts":[178],"their":[183],"adaptation":[184],"tasks.":[187],"Finally,":[188],"we":[189],"present":[190],"future":[191],"directions":[192],"further":[194],"improvement":[195],"transformer-based":[198],"models.":[200]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":28},{"year":2024,"cited_by_count":32},{"year":2023,"cited_by_count":10}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
