{"id":"https://openalex.org/W3194784984","doi":"https://doi.org/10.1145/3469213.3470323","title":"Attention-Guided CutMix Data Augmentation Network for Fine-Grained Bird Recognition","display_name":"Attention-Guided CutMix Data Augmentation Network for Fine-Grained Bird Recognition","publication_year":2021,"publication_date":"2021-05-28","ids":{"openalex":"https://openalex.org/W3194784984","doi":"https://doi.org/10.1145/3469213.3470323","mag":"3194784984"},"language":"en","primary_location":{"id":"doi:10.1145/3469213.3470323","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3469213.3470323","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 2nd International Conference on Artificial Intelligence and Information Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101130385","display_name":"Wenming Guo","orcid":"https://orcid.org/0000-0003-4167-4557"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wenming Guo","raw_affiliation_strings":["Beijing University of Posts and Telecommunications, China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100365573","display_name":"Yifei Wang","orcid":"https://orcid.org/0000-0002-0688-6012"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yifei Wang","raw_affiliation_strings":["Beijing University of Posts and Telecommunications, China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101620682","display_name":"Fang Han","orcid":"https://orcid.org/0000-0002-1937-4710"},"institutions":[{"id":"https://openalex.org/I4210111575","display_name":"Xinjiang Institute of Engineering","ror":"https://ror.org/01s5hh873","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210111575","https://openalex.org/I4210157944"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fang Han","raw_affiliation_strings":["Xinjiang Institute of Engineering, China"],"affiliations":[{"raw_affiliation_string":"Xinjiang Institute of Engineering, China","institution_ids":["https://openalex.org/I4210111575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101130385"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":0.1769,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.50414508,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11665","display_name":"Animal Vocal Communication and Behavior","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/1309","display_name":"Developmental Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11665","display_name":"Animal Vocal Communication and Behavior","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/1309","display_name":"Developmental Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9846000075340271,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.8580679893493652},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.8276842832565308},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.679796576499939},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6663112640380859},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5977429747581482},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5905391573905945},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.5305545330047607},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.521893322467804},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.457286536693573},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4390179514884949},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.4301515519618988},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.4237039089202881},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3154430687427521}],"concepts":[{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.8580679893493652},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.8276842832565308},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.679796576499939},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6663112640380859},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5977429747581482},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5905391573905945},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.5305545330047607},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.521893322467804},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.457286536693573},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4390179514884949},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.4301515519618988},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.4237039089202881},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3154430687427521},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3469213.3470323","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3469213.3470323","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 2nd International Conference on Artificial Intelligence and Information Systems","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7599999904632568,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W2104657103","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2462457117","https://openalex.org/W2520774990","https://openalex.org/W2737725206","https://openalex.org/W2763070548","https://openalex.org/W2773003563"],"related_works":["https://openalex.org/W2404514746","https://openalex.org/W2743258233","https://openalex.org/W2806866760","https://openalex.org/W2586441539","https://openalex.org/W2902062472","https://openalex.org/W2311479510","https://openalex.org/W1905704307","https://openalex.org/W2207021851","https://openalex.org/W2905846897","https://openalex.org/W3131127372"],"abstract_inverted_index":{"Large":[0],"inter-class":[1],"variations,":[2],"intra-class":[3],"similarities":[4],"and":[5,65,100,107,136,160,193],"the":[6,48,94,155,161,164,187,191,199],"difficulties":[7],"in":[8,16],"collectiing":[9],"training":[10,122,162],"samples":[11],"are":[12],"three":[13],"major":[14],"challenges":[15],"fine-grained":[17],"bird":[18],"recognition.":[19],"Hence,":[20],"it's":[21],"essential":[22],"for":[23],"accurate":[24],"classification":[25,188],"that":[26,180],"achieving":[27],"a":[28,72,83,112,129,148],"discriminative":[29,80,131],"feature":[30,63,98],"representation":[31],"from":[32,68],"birds\u2019":[33,58],"parts.":[34,59],"In":[35,146],"this":[36],"work,":[37],"we":[38,61,110],"propose":[39],"Attention-Guided":[40],"CutMix":[41],"Data":[42],"Augmentation":[43],"Network":[44],"(AGCN)":[45],"to":[46,50,104,117,141,152],"exercise":[47],"network":[49,192],"pay":[51],"more":[52],"attention":[53,66,77,101,127,158],"on":[54,125,198],"subtle":[55],"features":[56,88],"about":[57],"Firstly,":[60],"generate":[62,142],"maps":[64,67,99,159],"an":[69,126,143],"image":[70,140],"by":[71,93],"backbone":[73],"network.":[74,165],"Specially,":[75],"each":[76,121],"map":[78],"contains":[79],"information":[81],"of":[82,157,163,190],"bird's":[84,130],"part.":[85],"Then":[86],"local":[87],"can":[89],"be":[90],"further":[91],"extracted":[92],"element-wise":[95],"multiplication":[96],"between":[97],"maps.":[102],"Next,":[103],"reduce":[105],"overfitting":[106],"optimize":[108],"performance,":[109],"design":[111],"data":[113,183],"augmentation":[114,184],"strategy":[115],"according":[116],"region-level":[118],"replacement.":[119],"For":[120],"image,":[123],"based":[124],"map,":[128],"region":[132],"is":[133,150],"located,":[134],"copied":[135],"pasted":[137],"into":[138],"another":[139],"augmented":[144],"image.":[145],"addition,":[147],"loss":[149],"designed":[151],"supervise":[153],"both":[154],"learning":[156],"AGCN":[166,194],"only":[167],"needs":[168],"image-level":[169],"category":[170],"labels":[171],"rather":[172],"than":[173],"bounding":[174],"boxes/part":[175],"annotations.":[176],"The":[177],"results":[178],"state":[179],"our":[181],"proposed":[182],"effectively":[185],"improves":[186],"performance":[189,197],"achieves":[195],"excellent":[196],"challenging":[200],"dataset,":[201],"CUB":[202],"Birds.":[203]},"counts_by_year":[{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
