{"id":"https://openalex.org/W4366996284","doi":"https://doi.org/10.1109/tip.2023.3268004","title":"Viewpoint-Adaptive Representation Disentanglement Network for Change Captioning","display_name":"Viewpoint-Adaptive Representation Disentanglement Network for Change Captioning","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4366996284","doi":"https://doi.org/10.1109/tip.2023.3268004","pmid":"https://pubmed.ncbi.nlm.nih.gov/37097800"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2023.3268004","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2023.3268004","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021557044","display_name":"Yunbin Tu","orcid":"https://orcid.org/0000-0002-9525-9060"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yunbin Tu","raw_affiliation_strings":["School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034640518","display_name":"Liang Li","orcid":"https://orcid.org/0000-0001-8437-4824"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]},{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Li","raw_affiliation_strings":["Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China","Lishui Institute of Hangzhou Dianzi University, Lishui, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Lishui Institute of Hangzhou Dianzi University, Lishui, Zhejiang, China","institution_ids":["https://openalex.org/I50760025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088659027","display_name":"Li Su","orcid":"https://orcid.org/0000-0003-4038-753X"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Su","raw_affiliation_strings":["School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100663187","display_name":"Junping Du","orcid":"https://orcid.org/0000-0001-8590-3767"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junping Du","raw_affiliation_strings":["School of Computer Science and Technology, Beijing University of Posts and Telecommunications, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072833759","display_name":"Ke L\u00fc","orcid":"https://orcid.org/0000-0003-0176-3088"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ke Lu","raw_affiliation_strings":["School of Engineering Science, University of Chinese Academy of Sciences, Beijing, China","Peng Cheng Laboratory, Nanshan, Shenzhen, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"School of Engineering Science, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Peng Cheng Laboratory, Nanshan, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028597017","display_name":"Qingming Huang","orcid":"https://orcid.org/0000-0001-7542-296X"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingming Huang","raw_affiliation_strings":["School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China","Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5021557044"],"corresponding_institution_ids":["https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":4.333,"has_fulltext":false,"cited_by_count":36,"citation_normalized_percentile":{"value":0.95746155,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"32","issue":null,"first_page":"2620","last_page":"2635"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9818000197410583,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.835423469543457},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7581848502159119},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6915349960327148},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.5868505239486694},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.544405460357666},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5297946333885193},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4497796595096588},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4253332018852234},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36050355434417725},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.35788851976394653},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.23294037580490112},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.19640865921974182}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.835423469543457},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7581848502159119},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6915349960327148},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.5868505239486694},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.544405460357666},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5297946333885193},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4497796595096588},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4253332018852234},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36050355434417725},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.35788851976394653},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.23294037580490112},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.19640865921974182},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2023.3268004","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2023.3268004","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:37097800","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37097800","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.5400000214576721,"id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G1108969597","display_name":null,"funder_award_id":"62192784","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1520374204","display_name":null,"funder_award_id":"U22B2038","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2092942873","display_name":null,"funder_award_id":"2018YFE0303104","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G2446480051","display_name":null,"funder_award_id":"2020108","funder_id":"https://openalex.org/F4320321133","funder_display_name":"Chinese Academy of Sciences"},{"id":"https://openalex.org/G2973092727","display_name":null,"funder_award_id":"62032022","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4199693610","display_name":null,"funder_award_id":"62236008","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6212863906","display_name":null,"funder_award_id":"U21B2038","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7801426869","display_name":null,"funder_award_id":"61931008","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321133","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":61,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1889081078","https://openalex.org/W1894683164","https://openalex.org/W1956340063","https://openalex.org/W2068228981","https://openalex.org/W2101105183","https://openalex.org/W2123301721","https://openalex.org/W2154652894","https://openalex.org/W2194775991","https://openalex.org/W2506483933","https://openalex.org/W2531409750","https://openalex.org/W2745461083","https://openalex.org/W2765658575","https://openalex.org/W2896457183","https://openalex.org/W2905544595","https://openalex.org/W2949554687","https://openalex.org/W2953461088","https://openalex.org/W2964196083","https://openalex.org/W2970927600","https://openalex.org/W2988981892","https://openalex.org/W3016796243","https://openalex.org/W3033043020","https://openalex.org/W3034682719","https://openalex.org/W3093309253","https://openalex.org/W3094171276","https://openalex.org/W3096808073","https://openalex.org/W3108170342","https://openalex.org/W3110074314","https://openalex.org/W3139049060","https://openalex.org/W3140300848","https://openalex.org/W3159583533","https://openalex.org/W3175933895","https://openalex.org/W3176470992","https://openalex.org/W3177048142","https://openalex.org/W3203526456","https://openalex.org/W4205844428","https://openalex.org/W4206621053","https://openalex.org/W4213455776","https://openalex.org/W4220790454","https://openalex.org/W4220863475","https://openalex.org/W4220974521","https://openalex.org/W4225739172","https://openalex.org/W4283271696","https://openalex.org/W4295312788","https://openalex.org/W4297779827","https://openalex.org/W4309938607","https://openalex.org/W4313007769","https://openalex.org/W4385245566","https://openalex.org/W6631190155","https://openalex.org/W6639432524","https://openalex.org/W6678262379","https://openalex.org/W6682631176","https://openalex.org/W6725318829","https://openalex.org/W6739901393","https://openalex.org/W6766978945","https://openalex.org/W6767194493","https://openalex.org/W6771497439","https://openalex.org/W6780226713","https://openalex.org/W6792695861","https://openalex.org/W6797360341","https://openalex.org/W6802779907"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W2775506363","https://openalex.org/W3088136942","https://openalex.org/W4290852288","https://openalex.org/W2949362007","https://openalex.org/W4283207562","https://openalex.org/W2963177403","https://openalex.org/W2330246314","https://openalex.org/W1968289971","https://openalex.org/W4300588357"],"abstract_inverted_index":{"Change":[0],"captioning":[1],"is":[2,80,122,154],"to":[3,31,58,71,82,88,124],"describe":[4],"the":[5,21,32,38,44,67,84,93,128,132,140,144,148],"fine-grained":[6],"change":[7,46,70,109],"between":[8,131],"a":[9,53,76,107,114],"pair":[10],"of":[11,69,96],"images.":[12],"The":[13,152],"pseudo":[14,62],"changes":[15,19,90],"caused":[16],"by":[17],"viewpoint":[18,89],"are":[20],"most":[22],"typical":[23],"distractors":[24],"in":[25,86],"this":[26,49],"task,":[27],"because":[28],"they":[29],"lead":[30],"feature":[33],"perturbation":[34],"and":[35,41,61,64,100,126],"shift":[36],"for":[37,111],"same":[39],"objects":[40],"thus":[42],"overwhelm":[43],"real":[45,60],"representation.":[47],"In":[48],"paper,":[50],"we":[51],"propose":[52],"viewpoint-adaptive":[54],"representation":[55,78,110,120],"disentanglement":[56,121],"network":[57],"distinguish":[59],"changes,":[63],"explicitly":[65],"capture":[66],"features":[68,130],"generate":[72],"accurate":[73],"captions.":[74],"Concretely,":[75],"position-embedded":[77,134],"learning":[79],"devised":[81],"facilitate":[83],"model":[85],"adapting":[87],"via":[91],"mining":[92],"intrinsic":[94],"properties":[95],"two":[97,133],"image":[98],"representations":[99],"modeling":[101],"their":[102],"position":[103],"information.":[104],"To":[105],"learn":[106],"reliable":[108],"decoding":[112],"into":[113],"natural":[115],"language":[116],"sentence,":[117],"an":[118],"unchanged":[119,129],"designed":[123],"identify":[125],"disentangle":[127],"representations.":[135],"Extensive":[136],"experiments":[137],"show":[138],"that":[139],"proposed":[141],"method":[142],"achieves":[143],"state-of-the-art":[145],"performance":[146],"on":[147],"four":[149],"public":[150],"datasets.":[151],"code":[153],"available":[155],"at":[156],"https://github.com/tuyunbin/VARD.":[157]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":14},{"year":2024,"cited_by_count":15},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
