{"id":"https://openalex.org/W4398226350","doi":"https://doi.org/10.1109/tcsvt.2024.3404100","title":"Learning Local Semantic Region Activations for Weakly Supervised Object Localization","display_name":"Learning Local Semantic Region Activations for Weakly Supervised Object Localization","publication_year":2024,"publication_date":"2024-05-22","ids":{"openalex":"https://openalex.org/W4398226350","doi":"https://doi.org/10.1109/tcsvt.2024.3404100"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2024.3404100","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3404100","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023957994","display_name":"Can Xu","orcid":"https://orcid.org/0000-0002-4944-0504"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Can Xu","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030769176","display_name":"Le Hui","orcid":"https://orcid.org/0000-0003-0851-6805"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Le Hui","raw_affiliation_strings":["School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Information, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081133385","display_name":"Yuehui Han","orcid":"https://orcid.org/0000-0002-6099-1673"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuehui Han","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047323226","display_name":"Haobo Jiang","orcid":"https://orcid.org/0000-0002-4536-5252"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haobo Jiang","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100360558","display_name":"Jiaxin Chen","orcid":"https://orcid.org/0000-0003-0548-4094"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaxin Chen","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089409762","display_name":"Jin Xie","orcid":"https://orcid.org/0000-0001-6978-8834"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Xie","raw_affiliation_strings":["State Key Laboratory for Novel Software Technology and the School of Intelligence Science and Technology, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology and the School of Intelligence Science and Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100726984","display_name":"Jian Yang","orcid":"https://orcid.org/0000-0003-4800-832X"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Yang","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5023957994"],"corresponding_institution_ids":["https://openalex.org/I36399199"],"apc_list":null,"apc_paid":null,"fwci":1.3901,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.83511752,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"34","issue":"10","first_page":"10182","last_page":"10193"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9889000058174133,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9889000058174133,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9821000099182129,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9779000282287598,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6888066530227661},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6338988542556763},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5542864799499512},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41490209102630615},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.41125285625457764},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3992232084274292}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6888066530227661},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6338988542556763},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5542864799499512},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41490209102630615},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.41125285625457764},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3992232084274292}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2024.3404100","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3404100","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.75,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":63,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W1797268635","https://openalex.org/W2110119381","https://openalex.org/W2117539524","https://openalex.org/W2183341477","https://openalex.org/W2295107390","https://openalex.org/W2441255125","https://openalex.org/W2600144439","https://openalex.org/W2752782242","https://openalex.org/W2761785940","https://openalex.org/W2798232928","https://openalex.org/W2798748179","https://openalex.org/W2883554151","https://openalex.org/W2889081631","https://openalex.org/W2911575099","https://openalex.org/W2963045696","https://openalex.org/W2963949812","https://openalex.org/W2963952323","https://openalex.org/W2964028976","https://openalex.org/W2964274719","https://openalex.org/W2979750740","https://openalex.org/W2990371274","https://openalex.org/W2992308087","https://openalex.org/W2994041372","https://openalex.org/W3034315787","https://openalex.org/W3034747217","https://openalex.org/W3035318183","https://openalex.org/W3035712793","https://openalex.org/W3047278355","https://openalex.org/W3082940248","https://openalex.org/W3086763124","https://openalex.org/W3092932168","https://openalex.org/W3102582269","https://openalex.org/W3103376464","https://openalex.org/W3107169861","https://openalex.org/W3110272085","https://openalex.org/W3120636940","https://openalex.org/W3136998836","https://openalex.org/W3142837074","https://openalex.org/W3176171254","https://openalex.org/W3176774696","https://openalex.org/W3188615767","https://openalex.org/W3203593070","https://openalex.org/W3204484221","https://openalex.org/W4200631217","https://openalex.org/W4221167635","https://openalex.org/W4226138051","https://openalex.org/W4289752563","https://openalex.org/W4294982611","https://openalex.org/W4312315124","https://openalex.org/W4312521687","https://openalex.org/W4312570500","https://openalex.org/W4312574296","https://openalex.org/W4313019229","https://openalex.org/W4313069833","https://openalex.org/W4364302321","https://openalex.org/W4386245233","https://openalex.org/W4390871714","https://openalex.org/W6637373629","https://openalex.org/W6675803743","https://openalex.org/W6779430525","https://openalex.org/W6783298742","https://openalex.org/W6788135285"],"related_works":["https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Weakly":[0],"supervised":[1],"object":[2],"localization":[3],"(WSOL)":[4],"aims":[5],"to":[6,39,49,52,81,144,162,175,190],"train":[7],"instance-level":[8],"locators":[9],"by":[10,268],"exploiting":[11],"accessible":[12],"image-level":[13],"labels.":[14],"By":[15],"multiplying":[16],"channel-wise":[17],"features":[18],"with":[19,221,235,245],"classification":[20],"weights":[21,73,205],"and":[22,70,91,111,125,232,242,248,254,271],"then":[23],"adding":[24],"them":[25],"together,":[26],"most":[27],"prior":[28],"works":[29],"follow":[30],"the":[31,34,41,59,75,83,93,101,104,112,147,164,172,177,192,212,215,239,265],"pipeline":[32],"of":[33,62,88,103,150,179],"Class":[35],"Activation":[36],"Map":[37],"(CAM)":[38],"collect":[40],"semantic":[42,86,148],"responses,":[43],"thereby":[44],"highlighting":[45],"regions":[46,110],"that":[47,228],"contribute":[48],"class":[50,60],"prediction":[51],"achieve":[53],"WSOL.":[54,134],"However,":[55],"CAM-based":[56],"methods":[57],"treat":[58],"contributions":[61],"all":[63,208],"pixel":[64,152],"positions":[65],"in":[66,100],"a":[67,120,139,159,185,222,246],"channel":[68,90],"equally":[69],"assign":[71,202],"dominant":[72],"for":[74,132],"discriminative":[76],"channels":[77],"biasedly.":[78],"This":[79],"fails":[80],"express":[82],"fine-grained":[84],"pixel-level":[85],"response":[87,149],"each":[89,151],"model":[92],"complex":[94],"contextual":[95],"relations":[96],"between":[97,107,166,195],"channels,":[98],"resulting":[99],"mixup":[102],"activation":[105,123,141],"value":[106],"non-discriminative":[108],"foreground":[109,223],"background.":[113],"To":[114],"alleviate":[115],"these":[116],"issues,":[117],"we":[118,136,157],"present":[119],"Local":[121],"Semantic":[122],"enhancement":[124],"Global":[126],"Spatial":[127],"correlation":[128,194],"mining":[129],"network":[130],"(LSGS-Net)":[131],"accurate":[133],"Specifically,":[135],"first":[137],"propose":[138,184],"local":[140,168,180,197,209],"generation":[142],"module":[143,189],"explicitly":[145],"learn":[146],"position":[153],"from":[154],"channels.":[155],"Then,":[156],"design":[158],"regularization":[160],"loss":[161],"supervise":[163],"consistency":[165],"similar":[167],"activations,":[169,198],"which":[170,199],"utilizes":[171],"cross-image":[173],"information":[174],"improve":[176],"accuracy":[178],"activations.":[181],"We":[182],"further":[183],"K-nearest":[186],"Neighbors":[187],"graph":[188],"capture":[191],"spatial":[193],"different":[196],"can":[200],"adaptively":[201],"more":[203],"proper":[204],"when":[206],"fusing":[207],"activation.":[210],"In":[211],"inference":[213],"stage,":[214],"bounding":[216],"box":[217],"will":[218],"be":[219],"determined":[220],"threshold.":[224],"Extensive":[225],"experiments":[226],"show":[227],"LSGS-Net":[229,262],"achieves":[230],"significant":[231],"consistent":[233],"improvement":[234],"various":[236],"backbones":[237],"on":[238,252,260],"CUB,":[240],"ILSVRC,":[241,255],"OpenImages":[243],"benchmarks,":[244],"97.5%":[247],"75.3%":[249],"GT-Known":[250],"LOC":[251],"CUB":[253],"respectively.":[256],"For":[257],"segmentation":[258],"quality":[259],"OpenImages,":[261],"already":[263],"exceeds":[264],"SOTA":[266],"method":[267],"1.2%":[269],"pIoU":[270],"1.9%":[272],"PxAP.":[273]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
