{"id":"https://openalex.org/W4391620901","doi":"https://doi.org/10.1109/tnnls.2024.3356310","title":"Attentive Learning Facilitates Generalization of Neural Networks","display_name":"Attentive Learning Facilitates Generalization of Neural Networks","publication_year":2024,"publication_date":"2024-02-07","ids":{"openalex":"https://openalex.org/W4391620901","doi":"https://doi.org/10.1109/tnnls.2024.3356310","pmid":"https://pubmed.ncbi.nlm.nih.gov/38324433"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2024.3356310","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2024.3356310","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036865546","display_name":"Shiye Lei","orcid":"https://orcid.org/0000-0001-7810-9346"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Shiye Lei","raw_affiliation_strings":["Sydney AI Centre and the School of Computer Science, Faculty of Engineering, The University of Sydney, Darlington, NSW, Australia","Faculty of Engineering, Sydney AI Centre and the School of Computer Science, The University of Sydney, Darlington, NSW, Australia"],"affiliations":[{"raw_affiliation_string":"Sydney AI Centre and the School of Computer Science, Faculty of Engineering, The University of Sydney, Darlington, NSW, Australia","institution_ids":["https://openalex.org/I129604602"]},{"raw_affiliation_string":"Faculty of Engineering, Sydney AI Centre and the School of Computer Science, The University of Sydney, Darlington, NSW, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100635369","display_name":"Fengxiang He","orcid":"https://orcid.org/0000-0001-5584-2385"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Fengxiang He","raw_affiliation_strings":["Artificial Intelligence and its Applications Institute, School of Informatics, University of Edinburgh, Edinburgh, U.K","School of Informatics, Artificial Intelligence and its Applications Institute, University of Edinburgh, Edinburgh, U.K"],"affiliations":[{"raw_affiliation_string":"Artificial Intelligence and its Applications Institute, School of Informatics, University of Edinburgh, Edinburgh, U.K","institution_ids":["https://openalex.org/I98677209"]},{"raw_affiliation_string":"School of Informatics, Artificial Intelligence and its Applications Institute, University of Edinburgh, Edinburgh, U.K","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027020832","display_name":"Haowen Chen","orcid":"https://orcid.org/0000-0002-9255-6772"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haowen Chen","raw_affiliation_strings":["Department of Mathematics, ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics, ETH Z&#x00FC;rich, Z&#x00FC;rich, Switzerland","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074103823","display_name":"Dacheng Tao","orcid":"https://orcid.org/0000-0001-7225-5449"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]},{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["AU","SG"],"is_corresponding":false,"raw_author_name":"Dacheng Tao","raw_affiliation_strings":["Sydney AI Centre and the School of Computer Science, Faculty of Engineering, The University of Sydney, Darlington, NSW, Australia","School of Computer Science and Engineering, Nanyang Technological University, Singapore, Singapore","Faculty of Engineering, Sydney AI Centre and the School of Computer Science, The University of Sydney, Darlington, NSW, Australia"],"affiliations":[{"raw_affiliation_string":"Sydney AI Centre and the School of Computer Science, Faculty of Engineering, The University of Sydney, Darlington, NSW, Australia","institution_ids":["https://openalex.org/I129604602"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]},{"raw_affiliation_string":"Faculty of Engineering, Sydney AI Centre and the School of Computer Science, The University of Sydney, Darlington, NSW, Australia","institution_ids":["https://openalex.org/I129604602"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5036865546"],"corresponding_institution_ids":["https://openalex.org/I129604602"],"apc_list":null,"apc_paid":null,"fwci":0.7252,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.72621284,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"36","issue":"2","first_page":"3329","last_page":"3342"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9891999959945679,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.7133251428604126},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5432780981063843},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5391576290130615},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5078769326210022},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.342682808637619},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1173422634601593}],"concepts":[{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.7133251428604126},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5432780981063843},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5391576290130615},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5078769326210022},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.342682808637619},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1173422634601593},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2024.3356310","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2024.3356310","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:38324433","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38324433","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5600000023841858,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":98,"referenced_works":["https://openalex.org/W78969641","https://openalex.org/W1686810756","https://openalex.org/W1994350438","https://openalex.org/W2001141328","https://openalex.org/W2053186076","https://openalex.org/W2068474925","https://openalex.org/W2070964041","https://openalex.org/W2084914070","https://openalex.org/W2097308346","https://openalex.org/W2120838001","https://openalex.org/W2122868074","https://openalex.org/W2124477890","https://openalex.org/W2127905518","https://openalex.org/W2194775991","https://openalex.org/W2566079294","https://openalex.org/W2593380010","https://openalex.org/W2754478492","https://openalex.org/W2766447205","https://openalex.org/W2796402180","https://openalex.org/W2903158431","https://openalex.org/W2914483840","https://openalex.org/W2963518130","https://openalex.org/W2963693826","https://openalex.org/W2963959597","https://openalex.org/W2964137095","https://openalex.org/W2981207549","https://openalex.org/W2999044305","https://openalex.org/W3004591935","https://openalex.org/W3014745075","https://openalex.org/W3022629704","https://openalex.org/W3035603281","https://openalex.org/W3084746729","https://openalex.org/W3090811446","https://openalex.org/W3093826057","https://openalex.org/W3099514962","https://openalex.org/W3102178346","https://openalex.org/W3104335155","https://openalex.org/W3118608800","https://openalex.org/W3118788053","https://openalex.org/W3121510528","https://openalex.org/W3136525286","https://openalex.org/W3159649695","https://openalex.org/W3175945177","https://openalex.org/W3177828909","https://openalex.org/W3199247446","https://openalex.org/W3210179814","https://openalex.org/W4200632698","https://openalex.org/W4206410067","https://openalex.org/W4206487645","https://openalex.org/W4213228517","https://openalex.org/W4287867670","https://openalex.org/W4298857966","https://openalex.org/W4299785371","https://openalex.org/W4300717047","https://openalex.org/W4307572631","https://openalex.org/W4320478046","https://openalex.org/W4379472738","https://openalex.org/W4384648322","https://openalex.org/W4385245566","https://openalex.org/W4385864301","https://openalex.org/W4387415233","https://openalex.org/W4388283588","https://openalex.org/W6631190155","https://openalex.org/W6637373629","https://openalex.org/W6637967152","https://openalex.org/W6674995422","https://openalex.org/W6680757391","https://openalex.org/W6683389101","https://openalex.org/W6684191040","https://openalex.org/W6713348437","https://openalex.org/W6726983090","https://openalex.org/W6734185594","https://openalex.org/W6739659843","https://openalex.org/W6741653254","https://openalex.org/W6745276634","https://openalex.org/W6745652151","https://openalex.org/W6755308174","https://openalex.org/W6764891227","https://openalex.org/W6767868811","https://openalex.org/W6773748089","https://openalex.org/W6773952175","https://openalex.org/W6778032888","https://openalex.org/W6778883912","https://openalex.org/W6779259321","https://openalex.org/W6779357159","https://openalex.org/W6782866703","https://openalex.org/W6787972765","https://openalex.org/W6788289293","https://openalex.org/W6790250994","https://openalex.org/W6796831281","https://openalex.org/W6797999826","https://openalex.org/W6803605065","https://openalex.org/W6803710616","https://openalex.org/W6805410244","https://openalex.org/W6854814838","https://openalex.org/W6922480057","https://openalex.org/W7034108470","https://openalex.org/W7071865489"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W4387369504","https://openalex.org/W3046775127","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W3107602296","https://openalex.org/W4364306694","https://openalex.org/W4312192474"],"abstract_inverted_index":{"This":[0],"article":[1],"studies":[2],"the":[3,28,39,44,57,63,77,83,88,92,100],"generalization":[4,118,126],"of":[5,102,109],"neural":[6],"networks":[7],"(NNs)":[8],"by":[9,34],"examining":[10],"how":[11],"a":[12,18,73,116],"network":[13,40],"changes":[14],"when":[15],"trained":[16],"on":[17,62,91,99],"training":[19,46,93],"sample":[20],"with":[21],"or":[22],"without":[23],"out-of-distribution":[24],"(OoD)":[25],"examples.":[26],"If":[27],"network's":[29],"predictions":[30],"are":[31],"less":[32],"influenced":[33],"fitting":[35],"OoD":[36],"examples,":[37],"then":[38],"learns":[41],"attentively":[42],"from":[43,104],"clean":[45],"set.":[47],"A":[48],"new":[49],"notion,":[50],"dataset-distraction":[51,78],"stability,":[52,85],"is":[53,120],"proposed":[54],"to":[55],"measure":[56],"influence.":[58],"Extensive":[59],"CIFAR-10/100":[60],"experiments":[61],"different":[64],"VGG,":[65],"ResNet,":[66],"WideResNet,":[67],"ViT":[68],"architectures,":[69],"and":[70,80,114,133],"optimizers":[71],"show":[72],"negative":[74],"correlation":[75],"between":[76],"stability":[79],"generalizability.":[81],"With":[82],"distraction":[84],"we":[86],"decompose":[87],"learning":[89,97,129],"process":[90],"set":[94],"into":[95],"multiple":[96],"processes":[98],"subsets":[101],"drawn":[103],"simpler":[105],"distributions,":[106],"i.e.,":[107],"distributions":[108],"smaller":[110],"intrinsic":[111],"dimensions":[112],"(IDs),":[113],"furthermore,":[115],"tighter":[117],"bound":[119],"derived.":[121],"Through":[122],"attentive":[123],"learning,":[124],"miraculous":[125],"in":[127],"deep":[128],"can":[130,136],"be":[131,138],"explained":[132],"novel":[134],"algorithms":[135],"also":[137],"designed.":[139]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
