{"id":"https://openalex.org/W4389352357","doi":"https://doi.org/10.1109/tpami.2023.3339628","title":"Context Disentangling and Prototype Inheriting for Robust Visual Grounding","display_name":"Context Disentangling and Prototype Inheriting for Robust Visual Grounding","publication_year":2023,"publication_date":"2023-12-05","ids":{"openalex":"https://openalex.org/W4389352357","doi":"https://doi.org/10.1109/tpami.2023.3339628","pmid":"https://pubmed.ncbi.nlm.nih.gov/38051621"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2023.3339628","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2023.3339628","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2312.11967","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101459385","display_name":"Wei Tang","orcid":"https://orcid.org/0000-0003-3414-2421"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Tang","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","School of Computer Science and Engineering, Nanjing University of Science and Technology, No. 200 Xiaolingwei Road, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0003-3414-2421","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, No. 200 Xiaolingwei Road, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034640518","display_name":"Liang Li","orcid":"https://orcid.org/0000-0001-8437-4824"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Li","raw_affiliation_strings":["Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-8437-4824","affiliations":[{"raw_affiliation_string":"Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101944061","display_name":"Xuejing Liu","orcid":"https://orcid.org/0000-0001-9612-3707"},"institutions":[{"id":"https://openalex.org/I4210128910","display_name":"Group Sense (China)","ror":"https://ror.org/036wd5777","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210128910"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuejing Liu","raw_affiliation_strings":["SenseTime Research, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-9612-3707","affiliations":[{"raw_affiliation_string":"SenseTime Research, Beijing, China","institution_ids":["https://openalex.org/I4210128910"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101923561","display_name":"Lu Jin","orcid":"https://orcid.org/0000-0002-2964-426X"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lu Jin","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","School of Computer Science and Engineering, Nanjing University of Science and Technology, No. 200 Xiaolingwei Road, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-2964-426X","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, No. 200 Xiaolingwei Road, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035112538","display_name":"Jinhui Tang","orcid":"https://orcid.org/0000-0001-9008-222X"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinhui Tang","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","School of Computer Science and Engineering, Nanjing University of Science and Technology, No. 200 Xiaolingwei Road, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0001-9008-222X","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, No. 200 Xiaolingwei Road, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017096005","display_name":"Zechao Li","orcid":"https://orcid.org/0000-0002-5341-5985"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zechao Li","raw_affiliation_strings":["School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","School of Computer Science and Engineering, Nanjing University of Science and Technology, No. 200 Xiaolingwei Road, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0002-5341-5985","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, No. 200 Xiaolingwei Road, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.3929,"has_fulltext":true,"cited_by_count":41,"citation_normalized_percentile":{"value":0.95955041,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"46","issue":"5","first_page":"3213","last_page":"3229"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8161464929580688},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6792707443237305},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.584380030632019},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5767282247543335},{"id":"https://openalex.org/keywords/referent","display_name":"Referent","score":0.46923404932022095},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.46624818444252014},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.45875099301338196},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.4501417279243469},{"id":"https://openalex.org/keywords/scene-statistics","display_name":"Scene statistics","score":0.43451449275016785},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.43137457966804504},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.41916632652282715},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.3549102246761322},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3538687825202942}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8161464929580688},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6792707443237305},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.584380030632019},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5767282247543335},{"id":"https://openalex.org/C2777096784","wikidata":"https://www.wikidata.org/wiki/Q3826351","display_name":"Referent","level":2,"score":0.46923404932022095},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.46624818444252014},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.45875099301338196},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.4501417279243469},{"id":"https://openalex.org/C197654239","wikidata":"https://www.wikidata.org/wiki/Q7430757","display_name":"Scene statistics","level":3,"score":0.43451449275016785},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43137457966804504},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.41916632652282715},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.3549102246761322},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3538687825202942},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tpami.2023.3339628","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2023.3339628","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:38051621","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38051621","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null},{"id":"pmh:oai:arXiv.org:2312.11967","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.11967","pdf_url":"https://arxiv.org/pdf/2312.11967","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2312.11967","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.11967","pdf_url":"https://arxiv.org/pdf/2312.11967","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.6800000071525574}],"awards":[{"id":"https://openalex.org/G4262806985","display_name":null,"funder_award_id":"2022ZD0118802","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G4536128632","display_name":null,"funder_award_id":"62322211","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5710919167","display_name":null,"funder_award_id":"62102181","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7975452587","display_name":null,"funder_award_id":"U20B2064","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320335892","display_name":"Youth Innovation Promotion Association","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4389352357.pdf","grobid_xml":"https://content.openalex.org/works/W4389352357.grobid-xml"},"referenced_works_count":84,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2081357526","https://openalex.org/W2251512949","https://openalex.org/W2277195237","https://openalex.org/W2547411571","https://openalex.org/W2558535589","https://openalex.org/W2568262903","https://openalex.org/W2570343428","https://openalex.org/W2583360688","https://openalex.org/W2606473278","https://openalex.org/W2752796333","https://openalex.org/W2770129969","https://openalex.org/W2799263800","https://openalex.org/W2832876791","https://openalex.org/W2904910963","https://openalex.org/W2946086442","https://openalex.org/W2949693283","https://openalex.org/W2960655175","https://openalex.org/W2962764817","https://openalex.org/W2963109634","https://openalex.org/W2963518342","https://openalex.org/W2963735856","https://openalex.org/W2963783181","https://openalex.org/W2963799213","https://openalex.org/W2964022527","https://openalex.org/W2964284374","https://openalex.org/W2964345792","https://openalex.org/W2966715458","https://openalex.org/W2969876226","https://openalex.org/W2984121207","https://openalex.org/W2986755220","https://openalex.org/W2986803748","https://openalex.org/W2987401211","https://openalex.org/W2987734933","https://openalex.org/W2998631105","https://openalex.org/W3033910970","https://openalex.org/W3034772468","https://openalex.org/W3035097537","https://openalex.org/W3035258717","https://openalex.org/W3035268124","https://openalex.org/W3087365719","https://openalex.org/W3091588028","https://openalex.org/W3092900959","https://openalex.org/W3093306589","https://openalex.org/W3096609285","https://openalex.org/W3109644378","https://openalex.org/W3110435696","https://openalex.org/W3119641295","https://openalex.org/W3156506295","https://openalex.org/W3159619744","https://openalex.org/W3163747765","https://openalex.org/W3171547673","https://openalex.org/W3172522282","https://openalex.org/W3173364567","https://openalex.org/W3173859428","https://openalex.org/W3174004334","https://openalex.org/W3174476431","https://openalex.org/W3182736162","https://openalex.org/W3184784418","https://openalex.org/W3202473058","https://openalex.org/W4214490042","https://openalex.org/W4225517085","https://openalex.org/W4225641084","https://openalex.org/W4247698036","https://openalex.org/W4280538209","https://openalex.org/W4281633595","https://openalex.org/W4283688199","https://openalex.org/W4283805152","https://openalex.org/W4287183620","https://openalex.org/W4287672528","https://openalex.org/W4289126595","https://openalex.org/W4301418420","https://openalex.org/W4309181071","https://openalex.org/W4312649925","https://openalex.org/W4313068342","https://openalex.org/W4313145013","https://openalex.org/W4320086030","https://openalex.org/W4392159830","https://openalex.org/W6757135208","https://openalex.org/W6766904570","https://openalex.org/W6767211374","https://openalex.org/W6797397777","https://openalex.org/W6839015040","https://openalex.org/W6849654190"],"related_works":["https://openalex.org/W2143938773","https://openalex.org/W2366781357","https://openalex.org/W2493878481","https://openalex.org/W1968508462","https://openalex.org/W2167817468","https://openalex.org/W97399927","https://openalex.org/W2145850538","https://openalex.org/W2900482274","https://openalex.org/W2145315825","https://openalex.org/W2024163894"],"abstract_inverted_index":{"Visual":[0],"grounding":[1,88],"(VG)":[2],"aims":[3],"to":[4,67,89,125,152,173],"locate":[5],"a":[6,14,76,122,168,174],"specific":[7],"target":[8,28],"in":[9,203],"an":[10],"image":[11],"based":[12],"on":[13,144,186],"given":[15],"language":[16],"query.":[17],"The":[18,109,136,192],"discriminative":[19],"information":[20],"from":[21,29,116],"context":[22,80,95,101],"is":[23],"important":[24],"for":[25,33,55,85,132,178],"distinguishing":[26],"the":[27,34,38,56,68,94,98,113,117,128,133,156,159,200],"other":[30],"objects,":[31],"particularly":[32],"targets":[35],"that":[36,196],"have":[37],"same":[39],"category":[40],"as":[41],"others.":[42],"However,":[43],"most":[44],"previous":[45],"methods":[46,202],"underestimate":[47],"such":[48],"information.":[49],"Moreover,":[50],"they":[51],"are":[52,164,184],"usually":[53],"designed":[54],"standard":[57,188],"scene":[58],"(without":[59],"any":[60],"novel":[61,77],"object),":[62],"which":[63,103],"limits":[64],"their":[65],"generalization":[66],"open-vocabulary":[69,134,190],"scene.":[70,135],"In":[71],"this":[72],"paper,":[73],"we":[74],"propose":[75],"framework":[78],"with":[79,167],"disentangling":[81,96],"and":[82,100,147,171,189],"prototype":[83,110,123],"inheriting":[84,111],"robust":[86],"visual":[87,119,148],"handle":[90],"both":[91,187,204],"scenes.":[92,191],"Specifically,":[93],"disentangles":[97],"referent":[99],"features,":[102,138,163],"achieves":[104],"better":[105],"discrimination":[106],"between":[107,158],"them.":[108],"inherits":[112],"prototypes":[114,151],"discovered":[115],"disentangled":[118,145],"features":[120,149],"by":[121,140],"bank":[124],"fully":[126],"utilize":[127],"seen":[129],"data,":[130],"especially":[131],"fused":[137],"obtained":[139],"leveraging":[141],"Hadamard":[142],"product":[143],"linguistic":[146],"of":[150,162],"avoid":[153],"sharp":[154],"adjusting":[155],"importance":[157],"two":[160],"types":[161],"then":[165],"attached":[166],"special":[169],"token":[170],"feed":[172],"vision":[175],"Transformer":[176],"encoder":[177],"bounding":[179],"box":[180],"regression.":[181],"Extensive":[182],"experiments":[183],"conducted":[185],"performance":[193],"comparisons":[194],"indicate":[195],"our":[197],"method":[198],"outperforms":[199],"state-of-the-art":[201],"scenarios.":[205]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":22},{"year":2024,"cited_by_count":13}],"updated_date":"2026-07-02T09:51:11.867554","created_date":"2025-10-10T00:00:00"}
