{"id":"https://openalex.org/W3129338559","doi":"https://doi.org/10.1109/tmm.2021.3061284","title":"Fine-Grained Categorization From RGB-D Images","display_name":"Fine-Grained Categorization From RGB-D Images","publication_year":2021,"publication_date":"2021-02-23","ids":{"openalex":"https://openalex.org/W3129338559","doi":"https://doi.org/10.1109/tmm.2021.3061284","mag":"3129338559"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2021.3061284","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2021.3061284","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067748062","display_name":"Yanhao Tan","orcid":"https://orcid.org/0000-0003-4296-5241"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yanhao Tan","raw_affiliation_strings":["School of Engineering Science, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Engineering Science, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102828803","display_name":"Mohammad Muntasir Rahman","orcid":null},"institutions":[{"id":"https://openalex.org/I40279923","display_name":"Islamic University","ror":"https://ror.org/04j1w0q97","country_code":"BD","type":"education","lineage":["https://openalex.org/I40279923"]},{"id":"https://openalex.org/I4210113480","display_name":"Mohamed bin Zayed University of Artificial Intelligence","ror":"https://ror.org/0258gkt32","country_code":"AE","type":"education","lineage":["https://openalex.org/I4210113480"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["AE","BD","CN"],"is_corresponding":false,"raw_author_name":"Mohammad Muntasir Rahman","raw_affiliation_strings":["Department of Computer Science and Engineering, Islamic University, Kushtia, Bangladesh","Mohamed bin Zayed University of Artificial Intelligence, Abu Dhabi, UAE","School of Engineering Science, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Islamic University, Kushtia, Bangladesh","institution_ids":["https://openalex.org/I40279923"]},{"raw_affiliation_string":"Mohamed bin Zayed University of Artificial Intelligence, Abu Dhabi, UAE","institution_ids":["https://openalex.org/I4210113480"]},{"raw_affiliation_string":"School of Engineering Science, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087535289","display_name":"Yanfu Yan","orcid":"https://orcid.org/0009-0008-2475-6802"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanfu Yan","raw_affiliation_strings":["School of Engineering Science, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Engineering Science, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100763213","display_name":"Jian Xue","orcid":"https://orcid.org/0000-0002-9460-802X"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Xue","raw_affiliation_strings":["School of Engineering Science, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Engineering Science, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082634513","display_name":"Ling Shao","orcid":"https://orcid.org/0000-0002-8264-6117"},"institutions":[{"id":"https://openalex.org/I4210116052","display_name":"Inception Institute of Artificial Intelligence","ror":"https://ror.org/02664zk40","country_code":"AE","type":"facility","lineage":["https://openalex.org/I4210116052"]}],"countries":["AE"],"is_corresponding":false,"raw_author_name":"Ling Shao","raw_affiliation_strings":["Inception Institute of Artificial Intelligence, Abu Dhabi, UAE"],"affiliations":[{"raw_affiliation_string":"Inception Institute of Artificial Intelligence, Abu Dhabi, UAE","institution_ids":["https://openalex.org/I4210116052"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5072833759","display_name":"Ke L\u00fc","orcid":"https://orcid.org/0000-0003-0176-3088"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ke Lu","raw_affiliation_strings":["Peng Cheng Laboratory, Shenzhen, Guangdong, China","School of Engineering Science, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I4210136793"]},{"raw_affiliation_string":"School of Engineering Science, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5067748062"],"corresponding_institution_ids":["https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.2907,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.53252625,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"24","issue":null,"first_page":"917","last_page":"928"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10616","display_name":"Smart Agriculture and AI","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8731514811515808},{"id":"https://openalex.org/keywords/categorization","display_name":"Categorization","score":0.8083226680755615},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.8000271320343018},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7514424324035645},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.694555401802063},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5979630947113037},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.4543962776660919},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4529482424259186},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4417738914489746},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4373733401298523},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3680686950683594}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8731514811515808},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.8083226680755615},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.8000271320343018},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7514424324035645},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.694555401802063},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5979630947113037},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.4543962776660919},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4529482424259186},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4417738914489746},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4373733401298523},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3680686950683594},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2021.3061284","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2021.3061284","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1825513639","display_name":null,"funder_award_id":"61972375","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1967286088","display_name":null,"funder_award_id":"61671426","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2973092727","display_name":null,"funder_award_id":"62032022","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4140602880","display_name":null,"funder_award_id":"61871258","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6458045927","display_name":null,"funder_award_id":"4182071","funder_id":"https://openalex.org/F4320322919","funder_display_name":"Natural Science Foundation of Beijing Municipality"},{"id":"https://openalex.org/G6917360456","display_name":null,"funder_award_id":"61929104","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7616891426","display_name":null,"funder_award_id":"Y95401YXX2","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322919","display_name":"Natural Science Foundation of Beijing Municipality","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":63,"referenced_works":["https://openalex.org/W56385144","https://openalex.org/W125693051","https://openalex.org/W1533417424","https://openalex.org/W1565402342","https://openalex.org/W1797268635","https://openalex.org/W1955942245","https://openalex.org/W1977295328","https://openalex.org/W1995113806","https://openalex.org/W2005756025","https://openalex.org/W2021851106","https://openalex.org/W2074099390","https://openalex.org/W2104657103","https://openalex.org/W2108598243","https://openalex.org/W2138011018","https://openalex.org/W2150856297","https://openalex.org/W2155893237","https://openalex.org/W2156222070","https://openalex.org/W2163309385","https://openalex.org/W2194775991","https://openalex.org/W2219155316","https://openalex.org/W2337845395","https://openalex.org/W2397854647","https://openalex.org/W2475098969","https://openalex.org/W2569298377","https://openalex.org/W2604134068","https://openalex.org/W2606128082","https://openalex.org/W2737725206","https://openalex.org/W2748826260","https://openalex.org/W2750980686","https://openalex.org/W2752585553","https://openalex.org/W2780418809","https://openalex.org/W2794721028","https://openalex.org/W2798365843","https://openalex.org/W2798913983","https://openalex.org/W2891054863","https://openalex.org/W2891951760","https://openalex.org/W2895359088","https://openalex.org/W2901017177","https://openalex.org/W2904332125","https://openalex.org/W2909381593","https://openalex.org/W2930080648","https://openalex.org/W2945472816","https://openalex.org/W2946009298","https://openalex.org/W2951730755","https://openalex.org/W2953915809","https://openalex.org/W2954146807","https://openalex.org/W2962798895","https://openalex.org/W2963066927","https://openalex.org/W2963148524","https://openalex.org/W2963150697","https://openalex.org/W2963956866","https://openalex.org/W2963966654","https://openalex.org/W2989786816","https://openalex.org/W3001668482","https://openalex.org/W3034687313","https://openalex.org/W3099903704","https://openalex.org/W3100930215","https://openalex.org/W4246193833","https://openalex.org/W6600609147","https://openalex.org/W6637373629","https://openalex.org/W6638319203","https://openalex.org/W6638677478","https://openalex.org/W6764782982"],"related_works":["https://openalex.org/W2774550181","https://openalex.org/W2524507886","https://openalex.org/W2283162247","https://openalex.org/W2052518016","https://openalex.org/W3082551657","https://openalex.org/W2085956791","https://openalex.org/W2081022503","https://openalex.org/W2767823485","https://openalex.org/W2407156159","https://openalex.org/W2822883015"],"abstract_inverted_index":{"In":[0,78],"the":[1,59,92,176],"field":[2],"of":[3,13,28,61,105,155,166,181],"computer":[4,49],"vision,":[5],"fine-grained":[6,76,89,179],"visual":[7],"categorization":[8,180],"has":[9],"attracted":[10],"a":[11,25,83,114,142],"lot":[12],"attention":[14],"and":[15,24,43,66,102,108,110,132,164],"made":[16],"great":[17],"progress":[18],"due":[19],"to":[20,122],"convolutional":[21],"neural":[22],"networks":[23,157],"large":[26],"number":[27],"publicly":[29],"available":[30],"datasets.":[31],"With":[32],"next-generation":[33],"sensing":[34],"technology,":[35],"RGB-D":[36,53,85,97,182],"cameras":[37,54],"can":[38,151],"provide":[39,118],"high-quality":[40],"synchronized":[41],"RGB":[42],"depth":[44],"images":[45,98],"for":[46,88,126,134,178],"solving":[47],"many":[48],"vision":[50],"problems.":[51],"Although":[52],"have":[55,70],"been":[56,72],"used":[57,74],"in":[58,75,113],"context":[60],"multi-view":[62],"object":[63],"category":[64],"detection":[65],"scene":[67],"understanding,":[68],"they":[69],"not":[71],"widely":[73],"classification.":[77],"this":[79],"paper,":[80],"we":[81],"introduce":[82],"multiview":[84],"dataset":[86,93],"RGBD-FG":[87],"categorization.":[90],"Currently,":[91],"contains":[94],"93":[95],"051":[96],"covering":[99],"19":[100],"super-categories":[101],"50":[103],"sub-categories":[104],"common":[106],"vegetables":[107],"fruit,":[109],"is":[111],"organized":[112],"hierarchical":[115],"manner.":[116],"We":[117,139,170],"extensive":[119],"experimental":[120],"results":[121],"establish":[123],"state-of-the-art":[124],"benchmarks":[125],"our":[127,173],"dataset,":[128],"illustrating":[129],"its":[130],"diversity":[131],"scope":[133],"improvement":[135],"through":[136],"future":[137],"work.":[138],"also":[140],"propose":[141],"novel":[143],"modality-specific":[144],"multimodal":[145,156],"network":[146],"called":[147],"FS-Multimodal":[148],"network,":[149],"which":[150],"solve":[152],"two":[153],"limitations":[154],"trained":[158],"based":[159],"on":[160],"fine-tuning":[161],"techniques:":[162],"over-fitting":[163],"lack":[165],"effective":[167],"depth-specific":[168],"features.":[169],"hope":[171],"that":[172],"study":[174],"lays":[175],"foundations":[177],"data.":[183]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
