{"id":"https://openalex.org/W4409920596","doi":"https://doi.org/10.1007/s00521-025-11226-1","title":"NiNformer: a network in network transformer with token mixing\u00a0generated gating function","display_name":"NiNformer: a network in network transformer with token mixing\u00a0generated gating function","publication_year":2025,"publication_date":"2025-04-29","ids":{"openalex":"https://openalex.org/W4409920596","doi":"https://doi.org/10.1007/s00521-025-11226-1"},"language":"en","primary_location":{"id":"doi:10.1007/s00521-025-11226-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-025-11226-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-025-11226-1.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s00521-025-11226-1.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018672713","display_name":"Abdullah Nazhat Abdullah","orcid":"https://orcid.org/0000-0002-1757-0785"},"institutions":[{"id":"https://openalex.org/I128277893","display_name":"Bah\u00e7e\u015fehir University","ror":"https://ror.org/00yze4d93","country_code":"TR","type":"education","lineage":["https://openalex.org/I128277893"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Abdullah Nazhat Abdullah","raw_affiliation_strings":["Computer Engineering Department, Bahcesehir University, Istanbul, Turkey"],"raw_orcid":"https://orcid.org/0000-0002-1757-0785","affiliations":[{"raw_affiliation_string":"Computer Engineering Department, Bahcesehir University, Istanbul, Turkey","institution_ids":["https://openalex.org/I128277893"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039551082","display_name":"Tarkan Ayd\u0131n","orcid":"https://orcid.org/0000-0002-2018-405X"},"institutions":[{"id":"https://openalex.org/I128277893","display_name":"Bah\u00e7e\u015fehir University","ror":"https://ror.org/00yze4d93","country_code":"TR","type":"education","lineage":["https://openalex.org/I128277893"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Tarkan Aydin","raw_affiliation_strings":["Computer Engineering Department, Bahcesehir University, Istanbul, Turkey"],"raw_orcid":"https://orcid.org/0000-0002-2018-405X","affiliations":[{"raw_affiliation_string":"Computer Engineering Department, Bahcesehir University, Istanbul, Turkey","institution_ids":["https://openalex.org/I128277893"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5018672713"],"corresponding_institution_ids":["https://openalex.org/I128277893"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.06279897,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"37","issue":"19","first_page":"13411","last_page":"13428"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5511408448219299},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.49819207191467285},{"id":"https://openalex.org/keywords/mixing","display_name":"Mixing (physics)","score":0.4844529628753662},{"id":"https://openalex.org/keywords/computational-science-and-engineering","display_name":"Computational Science and Engineering","score":0.4630261957645416},{"id":"https://openalex.org/keywords/gating","display_name":"Gating","score":0.4418966770172119},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.27260226011276245},{"id":"https://openalex.org/keywords/neuroscience","display_name":"Neuroscience","score":0.1805342137813568},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.14601990580558777},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.1393994688987732},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.10721546411514282}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5511408448219299},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.49819207191467285},{"id":"https://openalex.org/C138777275","wikidata":"https://www.wikidata.org/wiki/Q6884054","display_name":"Mixing (physics)","level":2,"score":0.4844529628753662},{"id":"https://openalex.org/C68597687","wikidata":"https://www.wikidata.org/wiki/Q362601","display_name":"Computational Science and Engineering","level":2,"score":0.4630261957645416},{"id":"https://openalex.org/C194544171","wikidata":"https://www.wikidata.org/wiki/Q21105679","display_name":"Gating","level":2,"score":0.4418966770172119},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.27260226011276245},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.1805342137813568},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.14601990580558777},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.1393994688987732},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.10721546411514282},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s00521-025-11226-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-025-11226-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-025-11226-1.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s00521-025-11226-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-025-11226-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-025-11226-1.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320329122","display_name":"Bah\u00e7e\u015fehir \u00dcniversitesi","ror":"https://ror.org/00yze4d93"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4409920596.pdf","grobid_xml":"https://content.openalex.org/works/W4409920596.grobid-xml"},"referenced_works_count":25,"referenced_works":["https://openalex.org/W2112796928","https://openalex.org/W2915716523","https://openalex.org/W2964110616","https://openalex.org/W3085139254","https://openalex.org/W3096609285","https://openalex.org/W3101118213","https://openalex.org/W3138516171","https://openalex.org/W3145602566","https://openalex.org/W3162090017","https://openalex.org/W3173365702","https://openalex.org/W3213368993","https://openalex.org/W4206706211","https://openalex.org/W4306955484","https://openalex.org/W4312847199","https://openalex.org/W4389666313","https://openalex.org/W4390874575","https://openalex.org/W4407196897","https://openalex.org/W6600109629","https://openalex.org/W6600116659","https://openalex.org/W6600159499","https://openalex.org/W6600281463","https://openalex.org/W6600581554","https://openalex.org/W6600741150","https://openalex.org/W6605052884","https://openalex.org/W6756688054"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2031449089","https://openalex.org/W2112596406","https://openalex.org/W2125499229","https://openalex.org/W2072696177","https://openalex.org/W4387096269","https://openalex.org/W4387096026","https://openalex.org/W2410610877"],"abstract_inverted_index":{"Abstract":[0],"The":[1,155],"attention":[2,32,66,167],"mechanism":[3,33,67],"is":[4,68],"the":[5,9,31,38,52,65,76,101,105,110,119,123,125,127,151,160,165,177,181,200,207,215,220],"primary":[6],"component":[7],"of":[8,78,85,115,136,180,187,219],"transformer":[10,40],"architecture;":[11],"it":[12,73],"has":[13,46],"led":[14],"to":[15,103,150],"significant":[16],"advancements":[17],"in":[18,37,51,100,118,172,214],"deep":[19],"learning":[20,186],"spanning":[21],"many":[22,49,95,130],"domains":[23],"and":[24,42,61,71,82,108,129,138],"covering":[25],"multiple":[26,211],"tasks.":[27],"In":[28],"computer":[29],"vision,":[30],"was":[34],"first":[35],"incorporated":[36],"vision":[39,53,120,221],"(ViT),":[41],"then":[43],"its":[44],"usage":[45],"expanded":[47],"into":[48],"tasks":[50],"domain,":[54],"such":[55,116],"as":[56,147],"classification,":[57],"segmentation,":[58],"object":[59],"detection,":[60],"image":[62,216],"generation.":[63],"While":[64],"very":[69],"expressive":[70],"capable,":[72],"comes":[74],"with":[75,133,169,183],"disadvantage":[77],"being":[79],"computationally":[80],"expensive":[81],"requiring":[83],"datasets":[84,212],"considerable":[86],"size":[87,112],"for":[88],"effective":[89],"optimization.":[90],"To":[91],"address":[92],"these":[93],"shortcomings,":[94],"designs":[96],"have":[97],"been":[98],"proposed":[99,157,201],"literature":[102],"reduce":[104],"computational":[106,145,161],"burden":[107],"alleviate":[109],"data":[111],"requirements.":[113],"Examples":[114],"attempts":[117,132],"domain":[121],"are":[122],"MLP-Mixer,":[124],"Conv-Mixer,":[126],"Perceiver-IO,":[128],"more":[131],"different":[134],"sets":[135],"advantages":[137],"disadvantages.":[139],"This":[140],"paper":[141],"introduces":[142],"a":[143,170,184,193],"new":[144],"block":[146,158],"an":[148],"alternative":[149],"standard":[152],"ViT":[153],"block.":[154],"newly":[156],"reduces":[159],"requirements":[162],"by":[163,192],"replacing":[164],"normal":[166],"layers":[168],"network":[171,173],"structure,":[174],"therefore":[175],"enhancing":[176],"static":[178],"approach":[179],"MLP-Mixer":[182],"dynamic":[185],"element-wise":[188],"gating":[189],"function":[190],"generated":[191],"token-mixing":[194],"process.":[195],"Extensive":[196],"experimentation":[197],"shows":[198],"that":[199],"design":[202],"provides":[203],"better":[204],"performance":[205],"than":[206],"baseline":[208],"architectures":[209],"on":[210],"applied":[213],"classification":[217],"task":[218],"domain.":[222]},"counts_by_year":[],"updated_date":"2026-06-13T06:13:01.061226","created_date":"2025-10-10T00:00:00"}
