{"id":"https://openalex.org/W3047362981","doi":"https://doi.org/10.1109/tip.2021.3099733","title":"HCE: Hierarchical Context Embedding for Region-Based Object Detection","display_name":"HCE: Hierarchical Context Embedding for Region-Based Object Detection","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3047362981","doi":"https://doi.org/10.1109/tip.2021.3099733","mag":"3047362981","pmid":"https://pubmed.ncbi.nlm.nih.gov/34339371"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2021.3099733","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2021.3099733","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2008.01338","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Zhao-Min Chen","orcid":"https://orcid.org/0000-0001-9492-0796"},"institutions":[{"id":"https://openalex.org/I146620803","display_name":"Wenzhou University","ror":"https://ror.org/020hxh324","country_code":"CN","type":"education","lineage":["https://openalex.org/I146620803"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhao-Min Chen","raw_affiliation_strings":["College of Computer Science and Artificial Intelligence, Wenzhou University, Wenzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Artificial Intelligence, Wenzhou University, Wenzhou, China","institution_ids":["https://openalex.org/I146620803"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xin Jin","orcid":"https://orcid.org/0000-0001-5508-7957"},"institutions":[{"id":"https://openalex.org/I4210155230","display_name":"Samsung (China)","ror":"https://ror.org/04yt00889","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210155230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Jin","raw_affiliation_strings":["Samsung Research Nanjing, Samsung Research, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Samsung Research Nanjing, Samsung Research, Nanjing, China","institution_ids":["https://openalex.org/I4210155230"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Bo-Rui Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726805","display_name":"Megvii (China)","ror":"https://ror.org/040b32p69","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726805"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo-Rui Zhao","raw_affiliation_strings":["Megvii Research Nanjing, Megvii Technology, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Megvii Research Nanjing, Megvii Technology, Nanjing, China","institution_ids":["https://openalex.org/I4401726805"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xiaoqin Zhang","orcid":"https://orcid.org/0000-0003-0958-7285"},"institutions":[{"id":"https://openalex.org/I146620803","display_name":"Wenzhou University","ror":"https://ror.org/020hxh324","country_code":"CN","type":"education","lineage":["https://openalex.org/I146620803"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoqin Zhang","raw_affiliation_strings":["College of Computer Science and Artificial Intelligence, Wenzhou University, Wenzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Artificial Intelligence, Wenzhou University, Wenzhou, China","institution_ids":["https://openalex.org/I146620803"]}]},{"author_position":"last","author":{"id":null,"display_name":"Yanwen Guo","orcid":null},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanwen Guo","raw_affiliation_strings":["National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I146620803"],"apc_list":null,"apc_paid":null,"fwci":2.1362,"has_fulltext":false,"cited_by_count":24,"citation_normalized_percentile":{"value":0.89020843,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"30","issue":null,"first_page":"6917","last_page":"6929"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.7333999872207642,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.7333999872207642,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.1307000070810318,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.024800000712275505,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6978999972343445},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6011999845504761},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5741999745368958},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5327000021934509},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5109999775886536},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.4708999991416931},{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.4562000036239624},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4388999938964844}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7878000140190125},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7465000152587891},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6978999972343445},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6011999845504761},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5741999745368958},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5327000021934509},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5109999775886536},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.508400022983551},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.4708999991416931},{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.4562000036239624},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4388999938964844},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4374000132083893},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4221999943256378},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.37229999899864197},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.3617999851703644},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.35910001397132874},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.3244999945163727},{"id":"https://openalex.org/C34146451","wikidata":"https://www.wikidata.org/wiki/Q5048094","display_name":"Cascade","level":2,"score":0.3102000057697296},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.3057999908924103},{"id":"https://openalex.org/C182521987","wikidata":"https://www.wikidata.org/wiki/Q2493877","display_name":"Viola\u2013Jones object detection framework","level":5,"score":0.29409998655319214},{"id":"https://openalex.org/C64754055","wikidata":"https://www.wikidata.org/wiki/Q7574053","display_name":"Spatial contextual awareness","level":2,"score":0.27219998836517334},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.26089999079704285}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tip.2021.3099733","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2021.3099733","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:34339371","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/34339371","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null},{"id":"pmh:oai:arXiv.org:2008.01338","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2008.01338","pdf_url":"https://arxiv.org/pdf/2008.01338","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2008.01338","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2008.01338","pdf_url":"https://arxiv.org/pdf/2008.01338","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G133414184","display_name":null,"funder_award_id":"U2033210","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G346084562","display_name":null,"funder_award_id":"LR17F030001","funder_id":"https://openalex.org/F4320338464","funder_display_name":"Natural Science Foundation of Zhejiang Province"},{"id":"https://openalex.org/G3796144338","display_name":null,"funder_award_id":"61922064","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G448318003","display_name":null,"funder_award_id":"C20170008","funder_id":"https://openalex.org/F4320336615","funder_display_name":"Science and Technology Plan Project of Wenzhou, China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320336615","display_name":"Science and Technology Plan Project of Wenzhou, China","ror":null},{"id":"https://openalex.org/F4320338464","display_name":"Natural Science Foundation of Zhejiang Province","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W1536680647","https://openalex.org/W1587447546","https://openalex.org/W1934621328","https://openalex.org/W2081293863","https://openalex.org/W2088049833","https://openalex.org/W2102605133","https://openalex.org/W2108598243","https://openalex.org/W2111868822","https://openalex.org/W2133324800","https://openalex.org/W2519284461","https://openalex.org/W2534457893","https://openalex.org/W2565639579","https://openalex.org/W2601564443","https://openalex.org/W2740832349","https://openalex.org/W2800283575","https://openalex.org/W2884068670","https://openalex.org/W2886904239","https://openalex.org/W2895403383","https://openalex.org/W2963037989","https://openalex.org/W2963091558","https://openalex.org/W2963150697","https://openalex.org/W2963300078","https://openalex.org/W2963351448","https://openalex.org/W2963603913","https://openalex.org/W2963857746","https://openalex.org/W2964241181","https://openalex.org/W2964444661","https://openalex.org/W2965391153","https://openalex.org/W2966926453","https://openalex.org/W2982770724","https://openalex.org/W2984816230","https://openalex.org/W2988452521","https://openalex.org/W3034779842","https://openalex.org/W3034971973","https://openalex.org/W3163225208","https://openalex.org/W3191338014","https://openalex.org/W6620707391","https://openalex.org/W6639102338","https://openalex.org/W6714138976","https://openalex.org/W6729983426","https://openalex.org/W6743749281","https://openalex.org/W6750227808","https://openalex.org/W6753412334","https://openalex.org/W6754632766","https://openalex.org/W6761115386","https://openalex.org/W6764322716","https://openalex.org/W6785652829"],"related_works":[],"abstract_inverted_index":{"State-of-the-art":[0],"two-stage":[1],"object":[2,12,107],"detectors":[3,95],"apply":[4],"a":[5,8,68,82,91],"classifier":[6],"to":[7,85,101,122,149,154,180,200,227],"sparse":[9],"set":[10],"of":[11,30,90,93,105,158,185,231],"proposals,":[13],"relying":[14],"on":[15],"region-wise":[16,26],"features":[17,129],"extracted":[18],"by":[19,96,132],"RoIPool":[20],"or":[21],"RoIAlign":[22],"as":[23,53,55,81],"inputs.":[24],"The":[25],"features,":[27,163],"in":[28],"spite":[29],"aligning":[31],"well":[32,54],"with":[33],"the":[34,40,87,103,118,166,182,229],"proposal":[35],"locations,":[36],"may":[37],"still":[38],"lack":[39],"crucial":[41],"context":[42,121,136],"information":[43,137],"which":[44,77,116,145,176],"is":[45,195],"necessary":[46],"for":[47,238],"filtering":[48],"out":[49],"noisy":[50],"background":[51],"detections,":[52],"recognizing":[56],"objects":[57],"possessing":[58],"no":[59],"distinctive":[60],"appearances.":[61],"To":[62],"address":[63],"this":[64],"issue,":[65],"we":[66,109,164],"present":[67],"simple":[69,218],"but":[70],"effective":[71],"Hierarchical":[72],"Context":[73],"Embedding":[74],"(HCE)":[75],"framework,":[76],"can":[78,177,223],"be":[79,178,224],"applied":[80],"plug-and-play":[83],"component,":[84],"facilitate":[86],"classification":[88,183],"ability":[89],"series":[92],"region-based":[94,186,207],"mining":[97],"contextual":[98,161],"cues.":[99],"Specifically,":[100],"advance":[102],"recognition":[104],"context-dependent":[106],"categories,":[108],"propose":[110,165],"an":[111],"image-level":[112,120],"categorical":[113],"embedding":[114],"module":[115],"leverages":[117],"holistic":[119],"learn":[123],"object-level":[124],"concepts.":[125],"Then,":[126],"novel":[127],"RoI":[128,151,162],"are":[130,146],"generated":[131],"exploiting":[133],"hierarchically":[134],"embedded":[135],"beneath":[138],"both":[139],"whole":[140],"images":[141],"and":[142,173,197,202,215,234,241],"interested":[143],"regions,":[144],"also":[147],"complementary":[148],"conventional":[150],"features.":[152],"Moreover,":[153],"make":[155],"full":[156],"use":[157],"our":[159,192,220],"hierarchical":[160],"early-and-late":[167],"fusion":[168,172],"strategies":[169],"(i.e.,":[170],"feature":[171],"confidence":[174],"fusion),":[175],"combined":[179],"boost":[181],"accuracy":[184],"detectors.":[187],"Comprehensive":[188],"experiments":[189],"demonstrate":[190],"that":[191],"HCE":[193,221],"framework":[194,222],"flexible":[196],"generalizable,":[198],"leading":[199],"significant":[201],"consistent":[203],"improvements":[204],"upon":[205],"various":[206],"detectors,":[208,233],"including":[209],"FPN,":[210],"Cascade":[211],"R-CNN,":[212],"Mask":[213],"R-CNN":[214],"PA-FPN.":[216],"With":[217],"modification,":[219],"conveniently":[225],"adapted":[226],"fit":[228],"structure":[230],"one-stage":[232],"achieve":[235],"improved":[236],"performance":[237],"SSD,":[239],"RetinaNet":[240],"EfficientDet.":[242]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":7}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2020-08-10T00:00:00"}
