{"id":"https://openalex.org/W4402218496","doi":"https://doi.org/10.1109/agro-geoinformatics262780.2024.10660703","title":"CMMSNet:A Multi-modal Semantic Segmentation Network for Rooftop Extraction based on SAR and Optical Images","display_name":"CMMSNet:A Multi-modal Semantic Segmentation Network for Rooftop Extraction based on SAR and Optical Images","publication_year":2024,"publication_date":"2024-07-15","ids":{"openalex":"https://openalex.org/W4402218496","doi":"https://doi.org/10.1109/agro-geoinformatics262780.2024.10660703"},"language":"en","primary_location":{"id":"doi:10.1109/agro-geoinformatics262780.2024.10660703","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/agro-geoinformatics262780.2024.10660703","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 12th International Conference on Agro-Geoinformatics (Agro-Geoinformatics)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102816890","display_name":"Zhengwei Shen","orcid":"https://orcid.org/0000-0001-7816-5081"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]},{"id":"https://openalex.org/I4210132079","display_name":"Hangzhou Wanxiang Polytechnic","ror":"https://ror.org/03sxnxp24","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210132079"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhengwei Shen","raw_affiliation_strings":["Polytechnic Institute, Zhejiang University,Hangzhou,China"],"affiliations":[{"raw_affiliation_string":"Polytechnic Institute, Zhejiang University,Hangzhou,China","institution_ids":["https://openalex.org/I4210132079","https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010234425","display_name":"Yongheng Shang","orcid":"https://orcid.org/0000-0001-8550-6710"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongheng Shang","raw_affiliation_strings":["Zhejiang University,College of Computer Science,Hangzhou,China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University,College of Computer Science,Hangzhou,China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054062261","display_name":"Xiaoyu Zhang","orcid":"https://orcid.org/0000-0002-7270-7270"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyu Zhang","raw_affiliation_strings":["Zhejiang University,School of Earth Sciences,Hangzhou,China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University,School of Earth Sciences,Hangzhou,China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069353502","display_name":"Jianwei Yin","orcid":"https://orcid.org/0000-0003-4703-7348"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianwei Yin","raw_affiliation_strings":["Zhejiang University,College of Computer Science,Hangzhou,China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University,College of Computer Science,Hangzhou,China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102740397","display_name":"Jun Han","orcid":"https://orcid.org/0000-0002-8606-7657"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jun Han","raw_affiliation_strings":["State Grid Jiangsu Economic Research Institute,Nanjing,China"],"affiliations":[{"raw_affiliation_string":"State Grid Jiangsu Economic Research Institute,Nanjing,China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101693641","display_name":"Chao Cai","orcid":"https://orcid.org/0000-0001-8388-7628"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chao Cai","raw_affiliation_strings":["State Grid Jiangsu Economic Research Institute,Nanjing,China"],"affiliations":[{"raw_affiliation_string":"State Grid Jiangsu Economic Research Institute,Nanjing,China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5102816890"],"corresponding_institution_ids":["https://openalex.org/I4210132079","https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":0.2501,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.52099566,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9688000082969666,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9688000082969666,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12364","display_name":"Archaeological Research and Protection","score":0.9573000073432922,"subfield":{"id":"https://openalex.org/subfields/1912","display_name":"Space and Planetary Science"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.934499979019165,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.751764714717865},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7462847232818604},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6172970533370972},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.578472375869751},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5123413801193237},{"id":"https://openalex.org/keywords/extraction","display_name":"Extraction (chemistry)","score":0.5072324275970459},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4421318769454956},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4220360815525055},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.34625372290611267},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.06732416152954102}],"concepts":[{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.751764714717865},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7462847232818604},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6172970533370972},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.578472375869751},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5123413801193237},{"id":"https://openalex.org/C4725764","wikidata":"https://www.wikidata.org/wiki/Q844704","display_name":"Extraction (chemistry)","level":2,"score":0.5072324275970459},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4421318769454956},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4220360815525055},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34625372290611267},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.06732416152954102},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/agro-geoinformatics262780.2024.10660703","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/agro-geoinformatics262780.2024.10660703","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 12th International Conference on Agro-Geoinformatics (Agro-Geoinformatics)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320326707","display_name":"State Grid Corporation of China","ror":"https://ror.org/05twwhs70"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2117539524","https://openalex.org/W2164943005","https://openalex.org/W2194775991","https://openalex.org/W2560023338","https://openalex.org/W2630837129","https://openalex.org/W2752782242","https://openalex.org/W2771517259","https://openalex.org/W3010622813","https://openalex.org/W4200142374","https://openalex.org/W4200556575","https://openalex.org/W4229058281","https://openalex.org/W4310582166","https://openalex.org/W4322707648","https://openalex.org/W4362465310","https://openalex.org/W4362465355","https://openalex.org/W4362703933","https://openalex.org/W6739696289","https://openalex.org/W6748481559"],"related_works":["https://openalex.org/W2379392295","https://openalex.org/W3160965418","https://openalex.org/W4379231730","https://openalex.org/W613940353","https://openalex.org/W2320915480","https://openalex.org/W4389858081","https://openalex.org/W2362990116","https://openalex.org/W2381300099","https://openalex.org/W2377297411","https://openalex.org/W1522196789"],"abstract_inverted_index":{"Distributed":[0],"rooftop":[1,369],"photovoltaic":[2],"systems":[3],"hold":[4],"immense":[5],"potential":[6],"for":[7,24,121,232,364,401],"renewable":[8],"energy":[9],"generation,":[10],"and":[11,68,147,169,184,222,236,260,285,294,317,350,355,397],"accurate":[12],"extraction":[13,139,366],"of":[14,83,103,128,188,242,296,327,367,373,383],"building":[15,122,368],"roofs":[16],"from":[17,57,167,218,264],"high-resolution":[18],"remote":[19,197,375,393],"sensing":[20,198,376,394],"imagery":[21],"is":[22,130,177,207,230,254],"crucial":[23,231],"their":[25],"development.":[26],"While":[27],"current":[28],"semantic":[29,116,182,344],"segmentation":[30,50,117,323,345],"methods":[31,77,346],"primarily":[32],"rely":[33,73],"on":[34,74,331],"single-modality":[35],"optical":[36,69,170,318],"images,":[37,70,319],"Synthetic":[38],"Aperture":[39],"Radar":[40],"(SAR)":[41],"offers":[42],"complementary":[43,81,104,312],"ground":[44],"information":[45,82,89,213,313],"that":[46,336],"can":[47],"significantly":[48],"enhance":[49],"accuracy.":[51],"However,":[52],"the":[53,80,87,91,137,142,148,186,215,224,239,292,300,311,321,332,365,371,381],"modality":[54,144,149,284],"disparities":[55],"arising":[56],"different":[58,92,194],"imaging":[59],"mechanisms":[60],"pose":[61],"challenges":[62,391],"in":[63,99,196,237,347,388,392,404],"feature":[64,95,138,165,240],"fusion":[65,76,115,150,295,387],"between":[66,90,214],"SAR":[67,168,316],"existing":[71,342],"approaches":[72],"simplistic":[75],"to":[78,162,179,256,282,309],"exploit":[79],"each":[84,243,283],"modality,":[85],"ignoring":[86],"correlative":[88,212],"modalities":[93,217],"during":[94],"extraction,":[96],"this":[97,175,228,267,405],"results":[98],"an":[100,201],"insufficient":[101],"integration":[102],"information.To":[105],"address":[106,185],"these":[107],"challenges,":[108],"we":[109],"introduce":[110],"CMMSNet,":[111],"a":[112,219,247,270,361],"novel":[113],"multi-modal":[114,261,356,374,385],"network":[118],"specifically":[119],"designed":[120,255],"roof":[123],"extraction.":[124],"The":[125],"main":[126],"architecture":[127],"CMMSNet":[129,161,339],"constituted":[131],"by":[132,160,279,315],"three":[133,134],"core":[135],"modules:":[136],"encoder":[140],"module,":[141,146],"heterogeneous":[143,262],"alignment":[145],"decoder":[151],"module.":[152],"Initially,":[153],"dual":[154],"independent":[155],"pyramid-structured":[156],"encoders":[157],"are":[158],"employed":[159],"separately":[163],"extract":[164],"pyramids":[166],"images":[171],"at":[172],"various":[173],"scales,":[174],"strategy":[176],"intended":[178],"capture":[180],"multi-scale":[181,259],"contexts":[183],"issue":[187],"large":[189],"spatial":[190,220],"scale":[191],"variations":[192],"among":[193],"objects":[195],"images.":[199,377],"Furthermore,":[200],"Adaptive":[202],"Feature":[203,250],"Alignment":[204],"Module":[205],"(AFAM)":[206],"introduced,":[208],"tasked":[209],"with":[210],"identifying":[211],"two":[216],"dimension":[221],"aligning":[223],"modal":[225],"features":[226,263,278,302],"accordingly,":[227],"process":[229],"facilitating":[233],"cross-modal":[234],"learning":[235],"enhancing":[238,291,320],"representation":[241],"modality.":[244],"In":[245],"addition,":[246],"Cross-Modal":[248],"Multi-Scale":[249],"Fusion":[251],"(CMMSFF)":[252],"module":[253,268],"effectively":[257],"integrates":[258],"both":[265,348,353],"modalities,":[266],"employs":[269],"channel":[271],"self-attention":[272],"mechanism,":[273],"which":[274],"adaptively":[275],"fuses":[276],"discriminative":[277],"applying":[280],"weights":[281],"selectively":[286],"discarding":[287],"irrelevant":[288],"components,":[289],"thus":[290],"selection":[293],"key":[297],"channels":[298],"within":[299],"multimodal":[301],"set.":[303],"This":[304,358],"innovative":[305],"approach":[306],"allows":[307],"us":[308],"harness":[310],"provided":[314],"overall":[322],"performance.":[324],"A":[325],"series":[326],"comprehensive":[328],"experiments":[329],"conducted":[330],"DFC23":[333],"dataset":[334],"demonstrate":[335],"our":[337],"proposed":[338],"outperforms":[340],"other":[341],"mainstream":[343],"stability":[349],"effectiveness,":[351],"including":[352],"single-modal":[354],"approaches.":[357],"achievement":[359],"sets":[360],"new":[362],"benchmark":[363],"through":[370],"use":[372],"Our":[378],"findings":[379],"highlight":[380],"importance":[382],"leveraging":[384],"data":[386],"addressing":[389],"real-world":[390],"image":[395],"analysis":[396],"offer":[398],"valuable":[399],"insights":[400],"future":[402],"research":[403],"domain.":[406]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-27T14:29:43.386196","created_date":"2025-10-10T00:00:00"}
