{"id":"https://openalex.org/W2902869558","doi":"https://doi.org/10.1109/icpr.2018.8545225","title":"A Multi-part Convolutional Attention Network for Fine-Grained Image Recognition","display_name":"A Multi-part Convolutional Attention Network for Fine-Grained Image Recognition","publication_year":2018,"publication_date":"2018-08-01","ids":{"openalex":"https://openalex.org/W2902869558","doi":"https://doi.org/10.1109/icpr.2018.8545225","mag":"2902869558"},"language":"en","primary_location":{"id":"doi:10.1109/icpr.2018.8545225","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr.2018.8545225","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 24th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112410699","display_name":"Weilin Zhong","orcid":"https://orcid.org/0009-0001-2960-3310"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weilin Zhong","raw_affiliation_strings":["School of Electronic, Information and Electrical Engineering, Shanghai Jiao Tong University, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic, Information and Electrical Engineering, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101708598","display_name":"Linfeng Jiang","orcid":"https://orcid.org/0000-0001-9643-5049"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Linfeng Jiang","raw_affiliation_strings":["School of Electronic, Information and Electrical Engineering, Shanghai Jiao Tong University, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic, Information and Electrical Engineering, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100375832","display_name":"Tao Zhang","orcid":"https://orcid.org/0000-0002-7192-5153"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tao Zhang","raw_affiliation_strings":["School of Electronic, Information and Electrical Engineering, Shanghai Jiao Tong University, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic, Information and Electrical Engineering, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064423286","display_name":"Jinsheng Ji","orcid":"https://orcid.org/0000-0002-5360-919X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinsheng Ji","raw_affiliation_strings":["School of Electronic, Information and Electrical Engineering, Shanghai Jiao Tong University, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic, Information and Electrical Engineering, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100553283","display_name":"Huilin Xiong","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huilin Xiong","raw_affiliation_strings":["School of Electronic, Information and Electrical Engineering, Shanghai Jiao Tong University, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic, Information and Electrical Engineering, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5112410699"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.5223,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.71828542,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":97},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9854000210762024,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.9328739047050476},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.8476511240005493},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7915747761726379},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7523536682128906},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6861739158630371},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.628785252571106},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.602875828742981},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5925655364990234},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.5636934638023376},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4661266803741455},{"id":"https://openalex.org/keywords/contextual-image-classification","display_name":"Contextual image classification","score":0.45962750911712646},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.43984344601631165},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.43467244505882263},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.41838985681533813},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4104700982570648},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3951629102230072}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.9328739047050476},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.8476511240005493},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7915747761726379},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7523536682128906},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6861739158630371},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.628785252571106},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.602875828742981},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5925655364990234},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.5636934638023376},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4661266803741455},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.45962750911712646},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.43984344601631165},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.43467244505882263},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.41838985681533813},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4104700982570648},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3951629102230072},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icpr.2018.8545225","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr.2018.8545225","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 24th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.7599999904632568}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W50291828","https://openalex.org/W56385144","https://openalex.org/W603908379","https://openalex.org/W1496650988","https://openalex.org/W1616462885","https://openalex.org/W1686810756","https://openalex.org/W1724369340","https://openalex.org/W1898560071","https://openalex.org/W1928906481","https://openalex.org/W2104657103","https://openalex.org/W2138011018","https://openalex.org/W2163605009","https://openalex.org/W2194011657","https://openalex.org/W2202499615","https://openalex.org/W2293078015","https://openalex.org/W2295107390","https://openalex.org/W2306952455","https://openalex.org/W2460852148","https://openalex.org/W2479109623","https://openalex.org/W2549125172","https://openalex.org/W2737725206","https://openalex.org/W2741910023","https://openalex.org/W2773003563","https://openalex.org/W2964176323","https://openalex.org/W3124951096","https://openalex.org/W6618372016","https://openalex.org/W6640376812","https://openalex.org/W6680138032","https://openalex.org/W6684191040","https://openalex.org/W6687751829","https://openalex.org/W6697443983"],"related_works":["https://openalex.org/W2773003563","https://openalex.org/W2951464224","https://openalex.org/W2772166407","https://openalex.org/W2155839910","https://openalex.org/W2604710550","https://openalex.org/W2761785940","https://openalex.org/W2741910023","https://openalex.org/W3191444301","https://openalex.org/W3160398990","https://openalex.org/W3027297840","https://openalex.org/W2965318645","https://openalex.org/W3204476431","https://openalex.org/W2767690801","https://openalex.org/W2964189431","https://openalex.org/W3103844505","https://openalex.org/W2890741129","https://openalex.org/W2949194058","https://openalex.org/W2952533407","https://openalex.org/W2949334740","https://openalex.org/W3128999341"],"abstract_inverted_index":{"The":[0],"goal":[1],"of":[2,10,55,122,148],"fine-grained":[3,171],"image":[4,99,141],"recognition":[5],"is":[6,22,79,113],"to":[7,13,28,115],"recognize":[8],"hundreds":[9],"sub-categories":[11],"affiliating":[12],"the":[14,29,41,56,75,97,123,140,145,157,165],"same":[15],"basic-level":[16],"category":[17],"(e.g.,":[18],"bird":[19],"species).":[20],"It":[21],"a":[23,61,87,106],"highly":[24],"challenging":[25,170],"task":[26],"due":[27],"large":[30],"intra-class":[31],"variance":[32],"and":[33,49,69,156,176],"small":[34],"inter-class":[35],"variance.":[36],"Existing":[37],"approaches":[38,167],"deal":[39],"with":[40],"subtle":[42],"difference":[43],"among":[44],"object":[45],"classes":[46],"via":[47],"learning":[48],"localizing":[50],"discriminative":[51,98],"parts.":[52],"However,":[53],"most":[54],"part":[57,110,131,136,150],"localization":[58,111,132],"methods":[59],"follow":[60],"step-to-step":[62],"manner":[63],"that":[64],"first":[65],"localizes":[66],"larger":[67,76],"parts":[68,73,100,118],"then":[70],"generates":[71],"smaller":[72],"from":[74,119],"ones,":[77],"which":[78,93,143],"not":[80],"efficient.":[81],"In":[82,104],"this":[83],"paper,":[84],"we":[85],"present":[86],"Multi-part":[88],"Convolutional":[89,125],"Attention":[90],"Network":[91],"(M-CAN),":[92],"simultaneously":[94],"focuses":[95],"on":[96,168],"at":[101],"multiple":[102],"scales.":[103],"specific,":[105],"convolutional":[107],"attention":[108],"based":[109],"network":[112,133],"presented":[114],"localize":[116],"multi-scale":[117],"different":[120],"layers":[121],"deep":[124],"Neural":[126],"Networks":[127],"(CNN).":[128],"Importantly,":[129],"our":[130,162],"requires":[134],"no":[135],"annotations":[137],"but":[138],"only":[139],"labels,":[142],"avoids":[144],"heavy":[146],"labor":[147],"complex":[149],"labeling.":[151],"We":[152],"conduct":[153],"comprehensive":[154],"experiments":[155],"experimental":[158],"results":[159],"show":[160],"that,":[161],"method":[163],"outperforms":[164],"state-of-the-art":[166],"three":[169],"datasets,":[172],"including":[173],"CUB-Birds,":[174],"Stanford-Dogs":[175],"Stanford-Cars.":[177]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
