{"id":"https://openalex.org/W4402352450","doi":"https://doi.org/10.1109/ijcnn60899.2024.10650050","title":"From Static to Dynamic: A Deeper, Faster, and Adaptive Language Modeling Approach","display_name":"From Static to Dynamic: A Deeper, Faster, and Adaptive Language Modeling Approach","publication_year":2024,"publication_date":"2024-06-30","ids":{"openalex":"https://openalex.org/W4402352450","doi":"https://doi.org/10.1109/ijcnn60899.2024.10650050"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn60899.2024.10650050","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10650050","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090543127","display_name":"Jiajia Li","orcid":"https://orcid.org/0009-0003-7143-9336"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiajia Li","raw_affiliation_strings":["Wuhan University,School of Information Management,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Information Management,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061142418","display_name":"Q. Li","orcid":"https://orcid.org/0009-0007-2531-6537"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiwei Li","raw_affiliation_strings":["Wuhan University,School of Computer Science,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Computer Science,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101686826","display_name":"Ping Wang","orcid":"https://orcid.org/0000-0002-0792-4113"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ping Wang","raw_affiliation_strings":["Wuhan University,Center for the Studies of Information Resources School of Information Management,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,Center for the Studies of Information Resources School of Information Management,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5090543127"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.12476905,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"1","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.951200008392334,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7474079132080078}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7474079132080078}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn60899.2024.10650050","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10650050","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":66,"referenced_works":["https://openalex.org/W1566289585","https://openalex.org/W1690739335","https://openalex.org/W1724438581","https://openalex.org/W2108278040","https://openalex.org/W2144578941","https://openalex.org/W2896457183","https://openalex.org/W2923014074","https://openalex.org/W2924902521","https://openalex.org/W2938830017","https://openalex.org/W2946794439","https://openalex.org/W2952902402","https://openalex.org/W2962677625","https://openalex.org/W2962784628","https://openalex.org/W2963323070","https://openalex.org/W2964110616","https://openalex.org/W2965373594","https://openalex.org/W2970106668","https://openalex.org/W2970120757","https://openalex.org/W2970597249","https://openalex.org/W2978017171","https://openalex.org/W2996428491","https://openalex.org/W2998183051","https://openalex.org/W2998385486","https://openalex.org/W3011411500","https://openalex.org/W3034457371","https://openalex.org/W3034999214","https://openalex.org/W3035030897","https://openalex.org/W3035038672","https://openalex.org/W3093968463","https://openalex.org/W3101163004","https://openalex.org/W3105966348","https://openalex.org/W3112673818","https://openalex.org/W3118485687","https://openalex.org/W3128933491","https://openalex.org/W3177265267","https://openalex.org/W3199418160","https://openalex.org/W4287824654","https://openalex.org/W4288347855","https://openalex.org/W4292779060","https://openalex.org/W4382239690","https://openalex.org/W4385245566","https://openalex.org/W4385571945","https://openalex.org/W4388187290","https://openalex.org/W4393157091","https://openalex.org/W4393160064","https://openalex.org/W6637551013","https://openalex.org/W6637709462","https://openalex.org/W6745447533","https://openalex.org/W6750615492","https://openalex.org/W6753640285","https://openalex.org/W6760732026","https://openalex.org/W6761910064","https://openalex.org/W6762945437","https://openalex.org/W6763701032","https://openalex.org/W6764409202","https://openalex.org/W6766673545","https://openalex.org/W6768021236","https://openalex.org/W6768851824","https://openalex.org/W6769227307","https://openalex.org/W6771917389","https://openalex.org/W6778883912","https://openalex.org/W6779313456","https://openalex.org/W6784536396","https://openalex.org/W6788135622","https://openalex.org/W6790709252","https://openalex.org/W6853599841"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"Transformer-empowered":[0],"Pre-trained":[1],"language":[2,12],"models":[3,132],"(PrLM)":[4],"have":[5],"achieved":[6],"great":[7],"success":[8],"in":[9,56,113],"sumless":[10],"natural":[11],"processing":[13],"tasks.":[14],"Meanwhile,":[15],"keeping":[16],"seeking":[17],"better":[18,163],"performance":[19,164],"leads":[20],"to":[21,82],"deeper":[22,24],"and":[23,85,123,137,139,149,165],"models,":[25],"which":[26,172],"is":[27,111],"surely":[28],"suboptimal":[29],"by":[30,160],"taking":[31],"the":[32,46,80,87,95,100,114,168,175],"same":[33],"deep":[34,50],"model":[35,51,81,96,158],"for":[36,52,106],"various":[37],"input":[38,91],"samples":[39],"with":[40],"different":[41],"learnable":[42],"complexities,":[43],"let":[44],"alone":[45],"unnecessity":[47],"of":[48,64,89,104,177],"too":[49],"\u2018easy\u2019":[53],"input.":[54],"Therefore":[55],"this":[57],"work,":[58],"we":[59,69],"explore":[60],"a":[61,71,120],"dynamic":[62],"use":[63,99],"Transformer":[65,110],"layers.":[66],"In":[67],"detail,":[68],"propose":[70],"novel":[72],"Transformer-the-Adaptive":[73,161],"including":[74,133],"an":[75],"estimator":[76],"module":[77],"that":[78,94,154],"enables":[79],"automatically":[83],"learn":[84],"evaluate":[86],"complexity":[88],"every":[90],"samples,":[92],"so":[93],"can":[97],"adaptively":[98],"most":[101],"economic":[102],"numbers":[103],"layers":[105],"inference.":[107],"The":[108],"proposed":[109,156],"implemented":[112],"current":[115],"state-of-the-art":[116],"PrLM,":[117],"ALBERT,":[118],"giving":[119],"deeper,":[121],"faster":[122],"adaptive":[124],"model,":[125,171],"ALBERTa.":[126],"We":[127],"train":[128],"four-size":[129],"optimized":[130,159],"ALBERTa":[131,157],"base,":[134],"large,":[135],"xlarge,":[136],"xxlarge":[138],"carry":[140],"out":[141],"experiments":[142],"on":[143],"three":[144],"typical":[145],"tasks":[146],"MRC,":[147],"NLU,":[148],"NER.":[150],"Experiment":[151],"results":[152],"show":[153],"our":[155],"has":[162],"efficiency":[166],"than":[167],"original":[169],"ALBERT":[170],"fully":[173],"reflects":[174],"effectiveness":[176],"Transformer-the-Adaptive.":[178]},"counts_by_year":[],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
