{"id":"https://openalex.org/W3123272955","doi":"https://doi.org/10.1109/vcip53242.2021.9675376","title":"Progressive Co-Attention Network for Fine-Grained Visual Classification","display_name":"Progressive Co-Attention Network for Fine-Grained Visual Classification","publication_year":2021,"publication_date":"2021-12-05","ids":{"openalex":"https://openalex.org/W3123272955","doi":"https://doi.org/10.1109/vcip53242.2021.9675376","mag":"3123272955"},"language":"en","primary_location":{"id":"doi:10.1109/vcip53242.2021.9675376","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip53242.2021.9675376","pdf_url":null,"source":{"id":"https://openalex.org/S4363608378","display_name":"2021 International Conference on Visual Communications and Image Processing (VCIP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Conference on Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100371729","display_name":"Tian Zhang","orcid":"https://orcid.org/0000-0002-1284-1232"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Tian Zhang","raw_affiliation_strings":["Pattern Recognition and Intelligent System Lab., Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Pattern Recognition and Intelligent System Lab., Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007417490","display_name":"Dongliang Chang","orcid":"https://orcid.org/0000-0002-4081-3001"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongliang Chang","raw_affiliation_strings":["Pattern Recognition and Intelligent System Lab., Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Pattern Recognition and Intelligent System Lab., Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039812471","display_name":"Zhanyu Ma","orcid":"https://orcid.org/0000-0003-2950-2488"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhanyu Ma","raw_affiliation_strings":["Beijing Academy of Artificial Intelligence, Beijing, China","Pattern Recognition and Intelligent System Lab., Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Academy of Artificial Intelligence, Beijing, China","institution_ids":["https://openalex.org/I4210100255"]},{"raw_affiliation_string":"Pattern Recognition and Intelligent System Lab., Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100445470","display_name":"Jun Guo","orcid":"https://orcid.org/0000-0001-9045-1339"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Guo","raw_affiliation_strings":["Pattern Recognition and Intelligent System Lab., Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Pattern Recognition and Intelligent System Lab., Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100371729"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":2.7574,"has_fulltext":false,"cited_by_count":60,"citation_normalized_percentile":{"value":0.93452722,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.9243016839027405},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7838064432144165},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7151936292648315},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6775869131088257},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6137179732322693},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5855460166931152},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5799959301948547},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5544819831848145},{"id":"https://openalex.org/keywords/contextual-image-classification","display_name":"Contextual image classification","score":0.5222424268722534},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5101040005683899},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5024192333221436},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.45459723472595215},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.4216846227645874},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.4214169681072235},{"id":"https://openalex.org/keywords/attention-network","display_name":"Attention network","score":0.41316890716552734},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3865029215812683},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.38643327355384827}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.9243016839027405},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7838064432144165},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7151936292648315},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6775869131088257},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6137179732322693},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5855460166931152},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5799959301948547},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5544819831848145},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.5222424268722534},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5101040005683899},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5024192333221436},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.45459723472595215},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4216846227645874},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.4214169681072235},{"id":"https://openalex.org/C2993807640","wikidata":"https://www.wikidata.org/wiki/Q103709453","display_name":"Attention network","level":2,"score":0.41316890716552734},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3865029215812683},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.38643327355384827},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/vcip53242.2021.9675376","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip53242.2021.9675376","pdf_url":null,"source":{"id":"https://openalex.org/S4363608378","display_name":"2021 International Conference on Visual Communications and Image Processing (VCIP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Conference on Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.7599999904632568}],"awards":[{"id":"https://openalex.org/G3515233813","display_name":null,"funder_award_id":"61922015,61773071,U19B2036","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6510677135","display_name":null,"funder_award_id":"2019YFF0303300,2019YFF0303302","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G7697810044","display_name":null,"funder_award_id":"Z200002","funder_id":"https://openalex.org/F4320322919","funder_display_name":"Natural Science Foundation of Beijing Municipality"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322919","display_name":"Natural Science Foundation of Beijing Municipality","ror":null},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W603908379","https://openalex.org/W1686810756","https://openalex.org/W1797268635","https://openalex.org/W1846799578","https://openalex.org/W1967632700","https://openalex.org/W2097117768","https://openalex.org/W2104657103","https://openalex.org/W2108598243","https://openalex.org/W2118696714","https://openalex.org/W2119525058","https://openalex.org/W2135706578","https://openalex.org/W2138011018","https://openalex.org/W2163605009","https://openalex.org/W2194775991","https://openalex.org/W2520774990","https://openalex.org/W2554320282","https://openalex.org/W2604195031","https://openalex.org/W2618530766","https://openalex.org/W2737725206","https://openalex.org/W2740620254","https://openalex.org/W2773003563","https://openalex.org/W2780838211","https://openalex.org/W2798365843","https://openalex.org/W2807931652","https://openalex.org/W2891951760","https://openalex.org/W2953915809","https://openalex.org/W2962858109","https://openalex.org/W2963066927","https://openalex.org/W2963407932","https://openalex.org/W2975251395","https://openalex.org/W2986821660","https://openalex.org/W2997426000","https://openalex.org/W2998619563","https://openalex.org/W3008809756","https://openalex.org/W3012202123","https://openalex.org/W3035367622","https://openalex.org/W3108870912","https://openalex.org/W6618372016","https://openalex.org/W6637373629","https://openalex.org/W6677700107","https://openalex.org/W6726946684","https://openalex.org/W6767607757","https://openalex.org/W6773968463"],"related_works":["https://openalex.org/W2965546495","https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W2761785940","https://openalex.org/W2129933262","https://openalex.org/W3128220219","https://openalex.org/W2565656575","https://openalex.org/W4386215069"],"abstract_inverted_index":{"Fine-grained":[0],"visual":[1,132],"classification":[2,133],"aims":[3],"to":[4,8,21,46,66,87,112,116],"recognize":[5,47],"images":[6],"belonging":[7],"multiple":[9],"sub-categories":[10],"within":[11,83],"a":[12,17],"same":[13],"category.":[14],"It":[15],"is":[16,97],"challenging":[18],"task":[19],"due":[20],"the":[22,42,73,80,89,104,109,114],"inherently":[23],"subtle":[24],"variations":[25],"among":[26],"highly-confused":[27],"categories.":[28],"Most":[29],"existing":[30],"methods":[31],"only":[32],"take":[33],"an":[34,58],"individual":[35],"image":[36,85],"as":[37],"input,":[38],"which":[39],"may":[40],"limit":[41],"ability":[43],"of":[44],"models":[45],"contrastive":[48],"clues":[49],"from":[50],"different":[51],"images.":[52],"In":[53],"this":[54,68],"paper,":[55],"we":[56,71,102],"propose":[57],"effective":[59],"method":[60],"called":[61],"progressive":[62],"co-attention":[63],"network":[64,115],"(PCA-Net)":[65],"tackle":[67],"problem.":[69],"Specifically,":[70],"calculate":[72],"channel-wise":[74],"similarity":[75],"by":[76,108],"encouraging":[77],"interaction":[78,111],"between":[79],"feature":[81],"channels":[82],"same-category":[84],"pairs":[86],"capture":[88],"common":[90],"discriminative":[91,120],"features.":[92],"Considering":[93],"that":[94],"complementary":[95],"information":[96],"also":[98],"crucial":[99],"for":[100],"recognition,":[101],"erase":[103],"prominent":[105],"areas":[106],"enhanced":[107],"channel":[110],"force":[113],"focus":[117],"on":[118,129],"other":[119],"regions.":[121],"The":[122],"proposed":[123],"model":[124],"has":[125],"achieved":[126],"competitive":[127],"results":[128],"three":[130],"fine-grained":[131],"benchmark":[134],"datasets:":[135],"CUB-200-2011,":[136],"Stanford":[137],"Cars,":[138],"and":[139],"FGVC":[140],"Aircraft.":[141]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":17},{"year":2024,"cited_by_count":15},{"year":2023,"cited_by_count":15},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":4}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
