{"id":"https://openalex.org/W3036594286","doi":"https://doi.org/10.1109/lra.2020.3003290","title":"3D-Aware Scene Change Captioning From Multiview Images","display_name":"3D-Aware Scene Change Captioning From Multiview Images","publication_year":2020,"publication_date":"2020-06-18","ids":{"openalex":"https://openalex.org/W3036594286","doi":"https://doi.org/10.1109/lra.2020.3003290","mag":"3036594286"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2020.3003290","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2020.3003290","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029961156","display_name":"Yue Qiu","orcid":"https://orcid.org/0000-0002-2181-9475"},"institutions":[{"id":"https://openalex.org/I146399215","display_name":"University of Tsukuba","ror":"https://ror.org/02956yf07","country_code":"JP","type":"education","lineage":["https://openalex.org/I146399215"]},{"id":"https://openalex.org/I73613424","display_name":"National Institute of Advanced Industrial Science and Technology","ror":"https://ror.org/01703db54","country_code":"JP","type":"government","lineage":["https://openalex.org/I73613424"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yue Qiu","raw_affiliation_strings":["Graduate School of Systems and Information Engineering, University of Tsukuba, Tsukuba, Japan","National Institute of Advanced Industrial Science and Technology (AIST), Tsukuba, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Systems and Information Engineering, University of Tsukuba, Tsukuba, Japan","institution_ids":["https://openalex.org/I146399215"]},{"raw_affiliation_string":"National Institute of Advanced Industrial Science and Technology (AIST), Tsukuba, Japan","institution_ids":["https://openalex.org/I73613424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043995369","display_name":"Yutaka Satoh","orcid":"https://orcid.org/0000-0002-0638-0855"},"institutions":[{"id":"https://openalex.org/I146399215","display_name":"University of Tsukuba","ror":"https://ror.org/02956yf07","country_code":"JP","type":"education","lineage":["https://openalex.org/I146399215"]},{"id":"https://openalex.org/I73613424","display_name":"National Institute of Advanced Industrial Science and Technology","ror":"https://ror.org/01703db54","country_code":"JP","type":"government","lineage":["https://openalex.org/I73613424"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yutaka Satoh","raw_affiliation_strings":["Graduate School of Systems and Information Engineering, University of Tsukuba, Tsukuba, Japan","National Institute of Advanced Industrial Science and Technology (AIST), Tsukuba, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Systems and Information Engineering, University of Tsukuba, Tsukuba, Japan","institution_ids":["https://openalex.org/I146399215"]},{"raw_affiliation_string":"National Institute of Advanced Industrial Science and Technology (AIST), Tsukuba, Japan","institution_ids":["https://openalex.org/I73613424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101490361","display_name":"Ryota Suzuki","orcid":"https://orcid.org/0000-0003-2156-844X"},"institutions":[{"id":"https://openalex.org/I73613424","display_name":"National Institute of Advanced Industrial Science and Technology","ror":"https://ror.org/01703db54","country_code":"JP","type":"government","lineage":["https://openalex.org/I73613424"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Ryota Suzuki","raw_affiliation_strings":["Hirokatsu Kataoka are with the National Institute of Advanced Industrial Science and Technology (AIST), Tsukuba, Japan"],"affiliations":[{"raw_affiliation_string":"Hirokatsu Kataoka are with the National Institute of Advanced Industrial Science and Technology (AIST), Tsukuba, Japan","institution_ids":["https://openalex.org/I73613424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060846465","display_name":"Kenji Iwata","orcid":"https://orcid.org/0000-0001-6609-8221"},"institutions":[{"id":"https://openalex.org/I73613424","display_name":"National Institute of Advanced Industrial Science and Technology","ror":"https://ror.org/01703db54","country_code":"JP","type":"government","lineage":["https://openalex.org/I73613424"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kenji Iwata","raw_affiliation_strings":["Hirokatsu Kataoka are with the National Institute of Advanced Industrial Science and Technology (AIST), Tsukuba, Japan"],"affiliations":[{"raw_affiliation_string":"Hirokatsu Kataoka are with the National Institute of Advanced Industrial Science and Technology (AIST), Tsukuba, Japan","institution_ids":["https://openalex.org/I73613424"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011507481","display_name":"Hirokatsu Kataoka","orcid":"https://orcid.org/0000-0001-8844-165X"},"institutions":[{"id":"https://openalex.org/I73613424","display_name":"National Institute of Advanced Industrial Science and Technology","ror":"https://ror.org/01703db54","country_code":"JP","type":"government","lineage":["https://openalex.org/I73613424"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hirokatsu Kataoka","raw_affiliation_strings":["Hirokatsu Kataoka are with the National Institute of Advanced Industrial Science and Technology (AIST), Tsukuba, Japan"],"affiliations":[{"raw_affiliation_string":"Hirokatsu Kataoka are with the National Institute of Advanced Industrial Science and Technology (AIST), Tsukuba, Japan","institution_ids":["https://openalex.org/I73613424"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5029961156"],"corresponding_institution_ids":["https://openalex.org/I146399215","https://openalex.org/I73613424"],"apc_list":null,"apc_paid":null,"fwci":1.8642,"has_fulltext":false,"cited_by_count":26,"citation_normalized_percentile":{"value":0.87967088,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"5","issue":"3","first_page":"4743","last_page":"4750"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8192086219787598},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.7985068559646606},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7749946117401123},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6971123814582825},{"id":"https://openalex.org/keywords/viewpoints","display_name":"Viewpoints","score":0.6856054067611694},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.6202346086502075},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.5829415917396545},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.5698825716972351},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.4616279900074005},{"id":"https://openalex.org/keywords/change-detection","display_name":"Change detection","score":0.4178951680660248},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.34159278869628906},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.1183384358882904}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8192086219787598},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.7985068559646606},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7749946117401123},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6971123814582825},{"id":"https://openalex.org/C2776035091","wikidata":"https://www.wikidata.org/wiki/Q7928819","display_name":"Viewpoints","level":2,"score":0.6856054067611694},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6202346086502075},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.5829415917396545},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.5698825716972351},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.4616279900074005},{"id":"https://openalex.org/C203595873","wikidata":"https://www.wikidata.org/wiki/Q25389927","display_name":"Change detection","level":2,"score":0.4178951680660248},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.34159278869628906},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.1183384358882904},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2020.3003290","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2020.3003290","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5299999713897705}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1505952289","https://openalex.org/W1514535095","https://openalex.org/W2005756025","https://openalex.org/W2077069816","https://openalex.org/W2077193177","https://openalex.org/W2101105183","https://openalex.org/W2108501770","https://openalex.org/W2112073811","https://openalex.org/W2133459682","https://openalex.org/W2154652894","https://openalex.org/W2168986765","https://openalex.org/W2194775991","https://openalex.org/W2292575701","https://openalex.org/W2317688867","https://openalex.org/W2506483933","https://openalex.org/W2559882727","https://openalex.org/W2560609797","https://openalex.org/W2561715562","https://openalex.org/W2745461083","https://openalex.org/W2774991885","https://openalex.org/W2793217313","https://openalex.org/W2808492412","https://openalex.org/W2950697717","https://openalex.org/W2963121255","https://openalex.org/W2963182550","https://openalex.org/W2963727135","https://openalex.org/W2964196083","https://openalex.org/W2971278627","https://openalex.org/W2988981892","https://openalex.org/W3011284655","https://openalex.org/W4231002530","https://openalex.org/W6630875275","https://openalex.org/W6675944832","https://openalex.org/W6682631176","https://openalex.org/W6739778489","https://openalex.org/W6746518932","https://openalex.org/W6746909395","https://openalex.org/W6763422710","https://openalex.org/W6763480078"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W2385368906","https://openalex.org/W3088136942","https://openalex.org/W2949362007","https://openalex.org/W2775506363","https://openalex.org/W4290852288","https://openalex.org/W4388893791","https://openalex.org/W4283207562","https://openalex.org/W2963177403","https://openalex.org/W2330246314"],"abstract_inverted_index":{"In":[0,167],"this":[1],"letter,":[2],"we":[3,98],"propose":[4,99],"a":[5,15,35,43,100,155,198,210],"framework":[6,101,208],"that":[7,12,32,102,145],"recognizes":[8],"and":[9,29,69,109,135,163,182,213],"describes":[10,110],"changes":[11,31],"occur":[13],"in":[14,21,34,42,91,158,197],"scene":[16,37,64,105,112],"observed":[17],"from":[18,73,106],"multiple":[19,107],"viewpoints":[20,108],"natural":[22],"language":[23],"text.":[24],"The":[25,142],"ability":[26,80],"to":[27,81,174,178,209],"recognize":[28,68],"describe":[30],"occurred":[33],"3D":[36,52,61,121,133],"plays":[38],"an":[39,116],"essential":[40],"role":[41],"variety":[44],"of":[45,118,123,131,160,205],"human-robot":[46],"interaction":[47],"applications.":[48],"However,":[49],"most":[50],"current":[51],"vision":[53],"studies":[54],"have":[55,78],"focused":[56],"on":[57,115],"understanding":[58,117,165],"the":[59,111,119,149,179,203],"static":[60],"scene.":[62],"Existing":[63],"change":[65,71,113,164],"captioning":[66],"approaches":[67],"generate":[70],"captions":[72],"single-view":[74],"images.":[75],"Those":[76],"methods":[77],"limited":[79],"deal":[82],"with":[83,188],"camera":[84,175],"movement,":[85],"object":[86,134,138],"occlusion,":[87],"which":[88,201],"are":[89],"common":[90],"real-world":[92],"settings.":[93],"To":[94],"resolve":[95],"these":[96],"problems,":[97],"observes":[103],"every":[104],"based":[114],"underlying":[120],"structure":[122],"scenes.":[124],"We":[125],"build":[126],"three":[127],"synthetic":[128],"datasets":[129],"consisting":[130],"primitive":[132],"scanned":[136],"real":[137],"models":[139],"for":[140,186],"evaluation.":[141],"results":[143,196],"indicate":[144],"our":[146,169,191,207],"method":[147,153,170,181,192],"outperforms":[148],"previous":[150,180],"state-of-the-art":[151],"2D-based":[152],"by":[154],"large":[156],"margin":[157],"terms":[159],"sentence":[161],"generation":[162],"correctness.":[166],"addition,":[168],"is":[171],"more":[172,211],"robust":[173],"movements":[176],"compared":[177],"also":[183,193],"performs":[184],"better":[185],"scenes":[187],"occlusions.":[189],"Moreover,":[190],"shows":[194],"encouraging":[195],"realistic":[199],"scene-setting,":[200],"indicates":[202],"possibility":[204],"adapting":[206],"complicated":[212],"extensive":[214],"scene-settings.":[215]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
