{"id":"https://openalex.org/W4310330865","doi":"https://doi.org/10.1109/tnnls.2022.3218471","title":"TS-CAM: Token Semantic Coupled Attention Map for Weakly Supervised Object Localization","display_name":"TS-CAM: Token Semantic Coupled Attention Map for Weakly Supervised Object Localization","publication_year":2022,"publication_date":"2022-11-24","ids":{"openalex":"https://openalex.org/W4310330865","doi":"https://doi.org/10.1109/tnnls.2022.3218471","pmid":"https://pubmed.ncbi.nlm.nih.gov/36417732"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2022.3218471","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2022.3218471","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103072099","display_name":"Yuan Yao","orcid":"https://orcid.org/0000-0002-3616-2496"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuan Yao","raw_affiliation_strings":["School of Electronics, Electrical and Communication Engineering, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics, Electrical and Communication Engineering, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052317536","display_name":"Fang Wan","orcid":"https://orcid.org/0000-0002-8083-9257"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fang Wan","raw_affiliation_strings":["School of Electronics, Electrical and Communication Engineering, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics, Electrical and Communication Engineering, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102910220","display_name":"Wei Gao","orcid":"https://orcid.org/0000-0003-0939-8214"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Gao","raw_affiliation_strings":["School of Electronics, Electrical and Communication Engineering, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics, Electrical and Communication Engineering, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067338071","display_name":"Xingjia Pan","orcid":"https://orcid.org/0000-0003-3699-8936"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xingjia Pan","raw_affiliation_strings":["Youtu Laboratory, Tencent, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Youtu Laboratory, Tencent, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038511307","display_name":"Zhiliang Peng","orcid":"https://orcid.org/0000-0002-6643-9329"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiliang Peng","raw_affiliation_strings":["School of Electronics, Electrical and Communication Engineering, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics, Electrical and Communication Engineering, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100393506","display_name":"Qi Tian","orcid":"https://orcid.org/0000-0002-7252-5047"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Tian","raw_affiliation_strings":["Huawei Noah&#x2019;s Ark Laboratory, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Huawei Noah&#x2019;s Ark Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015317495","display_name":"Qixiang Ye","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qixiang Ye","raw_affiliation_strings":["School of Electronics, Electrical and Communication Engineering, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics, Electrical and Communication Engineering, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5103072099"],"corresponding_institution_ids":["https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":2.9557,"has_fulltext":false,"cited_by_count":29,"citation_normalized_percentile":{"value":0.92596669,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"35","issue":"7","first_page":"9109","last_page":"9121"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7831299304962158},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.6875303983688354},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6443901062011719},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6048291325569153},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5987063646316528},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.5791586637496948},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5030147433280945},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.46863341331481934},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.43202924728393555},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.10798200964927673}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7831299304962158},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.6875303983688354},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6443901062011719},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6048291325569153},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5987063646316528},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.5791586637496948},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5030147433280945},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.46863341331481934},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43202924728393555},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10798200964927673},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2022.3218471","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2022.3218471","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:36417732","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/36417732","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.75,"id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G1295000622","display_name":null,"funder_award_id":"61836012","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2088458048","display_name":null,"funder_award_id":"62006216","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G622688436","display_name":null,"funder_award_id":"XDA27000000","funder_id":"https://openalex.org/F4320321133","funder_display_name":"Chinese Academy of Sciences"},{"id":"https://openalex.org/G6735075065","display_name":null,"funder_award_id":"62225208","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321133","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W4205463238","https://openalex.org/W1482209366","https://openalex.org/W2110523656","https://openalex.org/W2521627374","https://openalex.org/W2981954115","https://openalex.org/W1177522693"],"abstract_inverted_index":{"Weakly":[0],"supervised":[1],"object":[2,7,31,36,54,113,138,167,187,219],"localization":[3,8,220],"(WSOL),":[4],"which":[5,49,95,161],"trains":[6],"models":[9],"using":[10],"solely":[11],"image":[12,129],"category":[13,139],"annotations,":[14],"remains":[15],"a":[16,131],"challenging":[17],"problem.":[18],"Existing":[19],"approaches":[20],"based":[21],"on":[22,39,201,221],"convolutional":[23],"neural":[24],"networks":[25],"(CNNs)":[26],"tend":[27],"to":[28,52,67,72,130,141,148,164,173],"miss":[29],"full":[30],"extent":[32],"while":[33],"activating":[34],"discriminative":[35],"parts.":[37],"Based":[38],"our":[40],"analysis,":[41],"this":[42,60],"is":[43,228],"caused":[44],"by":[45,79,126,197],"CNN's":[46],"intrinsic":[47],"characteristics,":[48],"experiences":[50],"difficulty":[51],"capture":[53,73,112],"semantics":[55,99,104,114,147],"at":[56,115,230],"long":[57,116],"distances.":[58],"In":[59],"article,":[61],"we":[62,178],"introduce":[63],"the":[64,70,87,103,181,208,222],"vision":[65],"transformer":[66],"WSOL,":[68],"with":[69,105,158,210],"aim":[71],"long-range":[74],"semantic":[75,89,171],"dependency":[76],"of":[77,133,183],"features":[78],"leveraging":[80],"transformer's":[81],"cascaded":[82],"self-attention":[83],"mechanism.":[84],"We":[85],"propose":[86],"token":[88],"coupled":[90,157],"attention":[91,106,159,176],"map":[92],"(TS-CAM)":[93],"method,":[94],"first":[96],"decomposes":[97],"class-aware":[98],"and":[100,118,199,203],"then":[101],"couples":[102],"maps":[107,160],"for":[108,185,217],"semantic-aware":[109,166,175],"activation.":[110],"To":[111,136],"distances":[117],"avoid":[119],"partial":[120],"activation,":[121],"TS-CAM":[122,144,184,192,213],"performs":[123],"spatial":[124],"embedding":[125],"partitioning":[127],"an":[128],"set":[132],"patch":[134,142,150,153],"tokens.":[135],"incorporate":[137],"information":[140],"tokens,":[143],"reallocates":[145],"category-related":[146],"each":[149],"token.":[151],"The":[152,226],"tokens":[154,172],"are":[155,162],"finally":[156],"semantic-agnostic":[163],"perform":[165],"localization.":[168,188],"By":[169],"introducing":[170],"produce":[174],"maps,":[177],"further":[179],"explore":[180],"capability":[182],"multicategory":[186,218],"Experiments":[189],"show":[190],"that":[191],"outperforms":[193],"its":[194],"CNN-CAM":[195],"counterpart":[196],"11.6%":[198],"28.9%":[200],"ILSVRC":[202],"CUB-200-2011":[204],"datasets,":[205],"respectively,":[206],"improving":[207],"state-of-the-art":[209],"large":[211],"margins.":[212],"also":[214],"demonstrates":[215],"superiority":[216],"Pascal":[223],"VOC":[224],"dataset.":[225],"code":[227],"available":[229],"github.com/yuanyao366/ts-cam-extension.":[231]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":10},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":6}],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2025-10-10T00:00:00"}
