{"id":"https://openalex.org/W2990154684","doi":"https://doi.org/10.1109/tmm.2019.2954747","title":"Bidirectional Attention-Recognition Model for Fine-Grained Object Classification","display_name":"Bidirectional Attention-Recognition Model for Fine-Grained Object Classification","publication_year":2019,"publication_date":"2019-11-20","ids":{"openalex":"https://openalex.org/W2990154684","doi":"https://doi.org/10.1109/tmm.2019.2954747","mag":"2990154684"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2019.2954747","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2019.2954747","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059194547","display_name":"Chuanbin Liu","orcid":"https://orcid.org/0000-0002-2840-6235"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chuanbin Liu","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078162380","display_name":"Hongtao Xie","orcid":"https://orcid.org/0000-0002-6249-5315"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongtao Xie","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003217535","display_name":"Zheng-Jun Zha","orcid":"https://orcid.org/0000-0003-2510-8993"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhengjun Zha","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089799495","display_name":"Lingyun Yu","orcid":"https://orcid.org/0000-0001-6403-761X"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lingyun Yu","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012931772","display_name":"Zhineng Chen","orcid":"https://orcid.org/0000-0002-0182-3207"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhineng Chen","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046305086","display_name":"Yongdong Zhang","orcid":"https://orcid.org/0000-0002-1151-1792"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongdong Zhang","raw_affiliation_strings":["School of Information Science and Technology, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5059194547"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":3.883,"has_fulltext":false,"cited_by_count":64,"citation_normalized_percentile":{"value":0.94975264,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"22","issue":"7","first_page":"1785","last_page":"1795"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8095018267631531},{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.7368525862693787},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6441022157669067},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.568324089050293},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5360406041145325},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.514889121055603},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.5022845268249512},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4860380291938782},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.48058032989501953},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.45869559049606323},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.4430181682109833},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4288488030433655}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8095018267631531},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.7368525862693787},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6441022157669067},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.568324089050293},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5360406041145325},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.514889121055603},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.5022845268249512},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4860380291938782},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.48058032989501953},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45869559049606323},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.4430181682109833},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4288488030433655},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2019.2954747","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2019.2954747","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.6800000071525574,"id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G4204336864","display_name":null,"funder_award_id":"2017YFC0820600","funder_id":"https://openalex.org/F4320336026","funder_display_name":"National Key Research and Development Program of China Stem Cell and Translational Research"},{"id":"https://openalex.org/G5616149779","display_name":null,"funder_award_id":"61771468","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7532226545","display_name":null,"funder_award_id":"2017209","funder_id":"https://openalex.org/F4320322847","funder_display_name":"Youth Innovation Promotion Association of the Chinese Academy of Sciences"},{"id":"https://openalex.org/G8290336390","display_name":null,"funder_award_id":"61525206","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322847","display_name":"Youth Innovation Promotion Association of the Chinese Academy of Sciences","ror":"https://ror.org/031141b54"},{"id":"https://openalex.org/F4320336026","display_name":"National Key Research and Development Program of China Stem Cell and Translational Research","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":93,"referenced_works":["https://openalex.org/W56385144","https://openalex.org/W639708223","https://openalex.org/W1616462885","https://openalex.org/W1686810756","https://openalex.org/W1797268635","https://openalex.org/W1846799578","https://openalex.org/W1898560071","https://openalex.org/W1928906481","https://openalex.org/W1955942245","https://openalex.org/W1977295328","https://openalex.org/W1995525705","https://openalex.org/W2023316690","https://openalex.org/W2028017042","https://openalex.org/W2083097051","https://openalex.org/W2088049833","https://openalex.org/W2102605133","https://openalex.org/W2104657103","https://openalex.org/W2108862644","https://openalex.org/W2129955511","https://openalex.org/W2138011018","https://openalex.org/W2142697503","https://openalex.org/W2163605009","https://openalex.org/W2194775991","https://openalex.org/W2211589372","https://openalex.org/W2289708887","https://openalex.org/W2306952455","https://openalex.org/W2322020277","https://openalex.org/W2440198081","https://openalex.org/W2460852148","https://openalex.org/W2474309084","https://openalex.org/W2479109623","https://openalex.org/W2510373542","https://openalex.org/W2533598788","https://openalex.org/W2555741539","https://openalex.org/W2579985080","https://openalex.org/W2613718673","https://openalex.org/W2618530766","https://openalex.org/W2621368668","https://openalex.org/W2737725206","https://openalex.org/W2741166240","https://openalex.org/W2744043447","https://openalex.org/W2746314669","https://openalex.org/W2747685395","https://openalex.org/W2758150123","https://openalex.org/W2763070548","https://openalex.org/W2765407302","https://openalex.org/W2773003563","https://openalex.org/W2783482415","https://openalex.org/W2798365843","https://openalex.org/W2804047946","https://openalex.org/W2807931652","https://openalex.org/W2808269424","https://openalex.org/W2883888092","https://openalex.org/W2891951760","https://openalex.org/W2896025697","https://openalex.org/W2912371042","https://openalex.org/W2916724381","https://openalex.org/W2938603906","https://openalex.org/W2942181934","https://openalex.org/W2951464224","https://openalex.org/W2963045696","https://openalex.org/W2963399829","https://openalex.org/W2963403868","https://openalex.org/W2963407932","https://openalex.org/W2963446712","https://openalex.org/W2964036919","https://openalex.org/W2997351497","https://openalex.org/W2998508940","https://openalex.org/W3103844505","https://openalex.org/W3106250896","https://openalex.org/W3124951096","https://openalex.org/W4295727797","https://openalex.org/W4385245566","https://openalex.org/W6636475194","https://openalex.org/W6637373629","https://openalex.org/W6638319203","https://openalex.org/W6638677478","https://openalex.org/W6640376812","https://openalex.org/W6679091853","https://openalex.org/W6681009388","https://openalex.org/W6698041030","https://openalex.org/W6732243160","https://openalex.org/W6739901393","https://openalex.org/W6742261329","https://openalex.org/W6743428213","https://openalex.org/W6743440100","https://openalex.org/W6745136726","https://openalex.org/W6747939174","https://openalex.org/W6751795773","https://openalex.org/W6752285806","https://openalex.org/W6758704467","https://openalex.org/W6759451268","https://openalex.org/W6785652829"],"related_works":["https://openalex.org/W4385957992","https://openalex.org/W4229079080","https://openalex.org/W4206534706","https://openalex.org/W4385965371","https://openalex.org/W4386025632","https://openalex.org/W2912445262","https://openalex.org/W3006943036","https://openalex.org/W4382142108","https://openalex.org/W2546942002","https://openalex.org/W3195820617"],"abstract_inverted_index":{"Fine-grained":[0],"object":[1,157],"classification":[2,193],"(FGOC)":[3],"is":[4,117,169],"a":[5,39,70,78,114,144,162,198],"challenging":[6],"research":[7],"topic":[8],"in":[9,69,130,143,192,208],"multimedia":[10],"computing":[11],"with":[12,31,204],"machine":[13],"learning,":[14],"which":[15],"faces":[16],"two":[17],"pivotal":[18],"conundrums:":[19],"focusing":[20],"attention":[21,97,123,133],"on":[22,181],"the":[23,32,46,52,58,86,122,132,136,148,188,205],"discriminate":[24,47,100],"part":[25,61,101],"regions,":[26],"and":[27,49,63,104,111,135,147,171,176,201],"then":[28,50],"processing":[29],"recognition":[30,65,106,127,137],"part-based":[33,53],"features.":[34,54],"Existing":[35],"approaches":[36],"generally":[37],"adopt":[38],"unidirectional":[40],"two-step":[41],"structure,":[42],"that":[43,60],"first":[44],"locate":[45],"parts":[48,159],"recognize":[51],"However,":[55],"they":[56],"neglect":[57],"truth":[59],"localization":[62],"feature":[64,109],"can":[66,139,151],"be":[67,152],"reinforced":[68],"bidirectional":[71,80,87,145],"process.":[72],"In":[73],"this":[74],"paper,":[75],"we":[76],"propose":[77],"novel":[79,163],"attention-recognition":[81],"model":[82],"(BARM)":[83],"to":[84,120],"actualize":[85],"reinforcement":[88],"for":[89,99,108,178],"FGOC.":[90,179],"The":[91],"proposed":[92],"BARM":[93,131,186,196],"consists":[94],"of":[95],"one":[96,105],"agent":[98,107,124,134,138],"regions":[102],"proposing":[103],"extraction":[110],"recognition.":[112],"Meanwhile,":[113],"feedback":[115],"flow":[116],"creatively":[118],"established":[119],"optimize":[121],"directly":[125],"by":[126],"agent.":[128],"Therefore,":[129],"reinforce":[140],"each":[141],"other":[142],"way":[146],"overall":[149],"framework":[150],"trained":[153],"end-to-end":[154],"without":[155],"neither":[156],"nor":[158],"annotations.":[160],"Moreover,":[161],"Multiple":[164],"Random":[165],"Erasing":[166],"data":[167],"augmentation":[168],"proposed,":[170],"it":[172],"exhibits":[173,197],"impressive":[174],"pertinency":[175],"superiority":[177],"Conducted":[180],"several":[182],"extensive":[183],"FGOC":[184],"benchmarks,":[185],"outperforms":[187],"present":[189],"state-of-the-art":[190],"methods":[191],"accuracy.":[194],"Furthermore,":[195],"clear":[199],"interpretability":[200],"keeps":[202],"consistent":[203],"human":[206],"perception":[207],"visualization":[209],"experiments.":[210]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":13},{"year":2021,"cited_by_count":19},{"year":2020,"cited_by_count":6}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
