{"id":"https://openalex.org/W7092293273","doi":"https://doi.org/10.1109/tcsvt.2025.3622736","title":"ChatStitch: Visualizing Through Structures via Surround-View Unsupervised Deep Image Stitching With Collaborative LLM-Agents","display_name":"ChatStitch: Visualizing Through Structures via Surround-View Unsupervised Deep Image Stitching With Collaborative LLM-Agents","publication_year":2025,"publication_date":"2025-10-17","ids":{"openalex":"https://openalex.org/W7092293273","doi":"https://doi.org/10.1109/tcsvt.2025.3622736"},"language":null,"primary_location":{"id":"doi:10.1109/tcsvt.2025.3622736","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3622736","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Hao Liang","orcid":"https://orcid.org/0000-0003-4183-3423"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Liang","raw_affiliation_strings":["School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-4183-3423","affiliations":[{"raw_affiliation_string":"School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zhipeng Dong","orcid":"https://orcid.org/0000-0002-1706-9253"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhipeng Dong","raw_affiliation_strings":["School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-1706-9253","affiliations":[{"raw_affiliation_string":"School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Kaixin Chen","orcid":"https://orcid.org/0009-0004-0733-9813"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaixin Chen","raw_affiliation_strings":["School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0004-0733-9813","affiliations":[{"raw_affiliation_string":"School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hao Li","orcid":"https://orcid.org/0009-0005-3565-501X"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Li","raw_affiliation_strings":["School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0005-3565-501X","affiliations":[{"raw_affiliation_string":"School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jiyuan Guo","orcid":null},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiyuan Guo","raw_affiliation_strings":["School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yufeng Yue","orcid":"https://orcid.org/0000-0001-6628-7946"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yufeng Yue","raw_affiliation_strings":["School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-6628-7946","affiliations":[{"raw_affiliation_string":"School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Mengyin Fu","orcid":"https://orcid.org/0000-0002-5520-7127"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengyin Fu","raw_affiliation_strings":["School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-5520-7127","affiliations":[{"raw_affiliation_string":"School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"last","author":{"id":null,"display_name":"Yi Yang","orcid":"https://orcid.org/0000-0003-3964-2433"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Yang","raw_affiliation_strings":["School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-3964-2433","affiliations":[{"raw_affiliation_string":"School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.50164381,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"36","issue":"3","first_page":"3027","last_page":"3040"},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6107000112533569,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6107000112533569,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.23720000684261322,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.03519999980926514,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/image-stitching","display_name":"Image stitching","score":0.9692000150680542},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.5335999727249146},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.5085999965667725},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4410000145435333},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4097000062465668},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.3292999863624573},{"id":"https://openalex.org/keywords/information-exchange","display_name":"Information exchange","score":0.3151000142097473}],"concepts":[{"id":"https://openalex.org/C29081049","wikidata":"https://www.wikidata.org/wiki/Q1364242","display_name":"Image stitching","level":2,"score":0.9692000150680542},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8083999752998352},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6467000246047974},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6308000087738037},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.5335999727249146},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.5085999965667725},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4410000145435333},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4097000062465668},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3292999863624573},{"id":"https://openalex.org/C189693848","wikidata":"https://www.wikidata.org/wiki/Q6031064","display_name":"Information exchange","level":2,"score":0.3151000142097473},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.31189998984336853},{"id":"https://openalex.org/C42781572","wikidata":"https://www.wikidata.org/wiki/Q1250322","display_name":"Digital image","level":4,"score":0.3019999861717224},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.30149999260902405},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.2881999909877777},{"id":"https://openalex.org/C178253425","wikidata":"https://www.wikidata.org/wiki/Q162668","display_name":"Visual perception","level":3,"score":0.2824999988079071},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.2644999921321869},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2621999979019165},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2563000023365021}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2025.3622736","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3622736","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2565581497","display_name":null,"funder_award_id":"92370203","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3511544556","display_name":null,"funder_award_id":"62233002","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8750879816","display_name":null,"funder_award_id":"2022YFC2603600","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":61,"referenced_works":["https://openalex.org/W1963246386","https://openalex.org/W1979076920","https://openalex.org/W2117228865","https://openalex.org/W2126060993","https://openalex.org/W2128409098","https://openalex.org/W2144042618","https://openalex.org/W2160072137","https://openalex.org/W2194775991","https://openalex.org/W2615547864","https://openalex.org/W2786533959","https://openalex.org/W2982681137","https://openalex.org/W2996759437","https://openalex.org/W3034275286","https://openalex.org/W3035098634","https://openalex.org/W3035172746","https://openalex.org/W3035574168","https://openalex.org/W3090375251","https://openalex.org/W3095840465","https://openalex.org/W3109991383","https://openalex.org/W3144819047","https://openalex.org/W3175249881","https://openalex.org/W3175385336","https://openalex.org/W3182360346","https://openalex.org/W3204792207","https://openalex.org/W3209102426","https://openalex.org/W3214403471","https://openalex.org/W4200235160","https://openalex.org/W4205125245","https://openalex.org/W4206138072","https://openalex.org/W4221151978","https://openalex.org/W4312275356","https://openalex.org/W4312306846","https://openalex.org/W4312604822","https://openalex.org/W4312939270","https://openalex.org/W4313016521","https://openalex.org/W4323644077","https://openalex.org/W4360610393","https://openalex.org/W4385245566","https://openalex.org/W4386065691","https://openalex.org/W4386076238","https://openalex.org/W4386076483","https://openalex.org/W4386083148","https://openalex.org/W4386634496","https://openalex.org/W4390872094","https://openalex.org/W4390872473","https://openalex.org/W4390970341","https://openalex.org/W4391516317","https://openalex.org/W4392016505","https://openalex.org/W4394595621","https://openalex.org/W4401357170","https://openalex.org/W4401686180","https://openalex.org/W4402703070","https://openalex.org/W4402753889","https://openalex.org/W4402769251","https://openalex.org/W4402951584","https://openalex.org/W4403722473","https://openalex.org/W4404691764","https://openalex.org/W4408223246","https://openalex.org/W4408323594","https://openalex.org/W4410226785","https://openalex.org/W4413917866"],"related_works":[],"abstract_inverted_index":{"Surround-view":[0],"perception":[1,12,29],"has":[2],"garnered":[3],"significant":[4],"attention":[5],"for":[6,146],"its":[7],"ability":[8],"to":[9],"enhance":[10],"the":[11,19,82,118,126,143],"capabilities":[13],"of":[14,21,65,157,165],"autonomous":[15],"driving":[16],"vehicles":[17],"through":[18,71],"exchange":[20],"information":[22,70],"with":[23,39,76,154],"surrounding":[24],"cameras.":[25],"However,":[26],"existing":[27],"surround-view":[28,60,111],"systems":[30],"are":[31],"limited":[32],"by":[33],"inefficiencies":[34],"in":[35,43],"unidirectional":[36,83],"interaction":[37,84,92],"pattern":[38],"human":[40],"and":[41,131,149,160,162,168],"distortions":[42],"overlapping":[44,105],"regions":[45],"exponentially":[46],"propagating":[47],"into":[48],"non-overlapping":[49],"areas.":[50],"To":[51,80,100],"address":[52],"these":[53],"challenges,":[54],"this":[55],"paper":[56],"introduces":[57],"ChatStitch,":[58],"a":[59,88,110],"human-machine":[61],"co-perception":[62],"system":[63],"capable":[64],"unveiling":[66],"obscured":[67],"blind":[68],"spot":[69],"natural":[72],"language":[73],"commands":[74],"integrated":[75],"external":[77],"digital":[78],"assets.":[79],"dismantle":[81],"bottleneck,":[85],"ChatStitch":[86,107],"implements":[87],"cognitively":[89],"grounded":[90],"closed-loop":[91],"multi-agent":[93],"framework":[94],"based":[95],"on":[96,125,142],"Large":[97],"Language":[98],"Models.":[99],"suppress":[101],"distortion":[102],"propagation":[103],"across":[104],"boundaries,":[106],"proposes":[108],"SV-UDIS,":[109],"unsupervised":[112],"deep":[113],"image":[114,151],"stitching":[115,152],"method":[116,138],"under":[117],"non-global-overlapping":[119],"condition.":[120],"We":[121],"conducted":[122],"extensive":[123],"experiments":[124],"UDIS-D,":[127],"MCOV-SLAM":[128],"open":[129],"datasets,":[130],"our":[132,136],"real-world":[133],"dataset.":[134],"Specifically,":[135],"SV-UDIS":[137],"achieves":[139],"state-of-the-art":[140],"performance":[141],"UDIS-D":[144],"dataset":[145],"3,":[147],"4,":[148],"5":[150],"tasks,":[153],"PSNR":[155],"improvements":[156,164],"9%,":[158],"17%,":[159],"21%,":[161],"SSIM":[163],"8%,":[166],"18%,":[167],"26%,":[169],"respectively.":[170],"The":[171],"code":[172],"is":[173],"available":[174],"at":[175],"https://github.com/lhlawrence/ChatStitch.":[176]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-18T00:00:00"}
