{"id":"https://openalex.org/W4405785392","doi":"https://doi.org/10.1109/iros58592.2024.10801872","title":"Efficient Multimodal Semantic Segmentation via Dual-Prompt Learning","display_name":"Efficient Multimodal Semantic Segmentation via Dual-Prompt Learning","publication_year":2024,"publication_date":"2024-10-14","ids":{"openalex":"https://openalex.org/W4405785392","doi":"https://doi.org/10.1109/iros58592.2024.10801872"},"language":"en","primary_location":{"id":"doi:10.1109/iros58592.2024.10801872","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10801872","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100630430","display_name":"Shaohua Dong","orcid":"https://orcid.org/0009-0008-2685-6217"},"institutions":[{"id":"https://openalex.org/I123534392","display_name":"University of North Texas","ror":"https://ror.org/00v97ad02","country_code":"US","type":"education","lineage":["https://openalex.org/I123534392"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shaohua Dong","raw_affiliation_strings":["University of North Texas,Dept. of Computer Science and Engineering"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Texas,Dept. of Computer Science and Engineering","institution_ids":["https://openalex.org/I123534392"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073748933","display_name":"Yunhe Feng","orcid":"https://orcid.org/0000-0001-6577-227X"},"institutions":[{"id":"https://openalex.org/I123534392","display_name":"University of North Texas","ror":"https://ror.org/00v97ad02","country_code":"US","type":"education","lineage":["https://openalex.org/I123534392"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yunhe Feng","raw_affiliation_strings":["University of North Texas,Dept. of Computer Science and Engineering"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Texas,Dept. of Computer Science and Engineering","institution_ids":["https://openalex.org/I123534392"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102751945","display_name":"Qing Yang","orcid":"https://orcid.org/0000-0003-3495-370X"},"institutions":[{"id":"https://openalex.org/I123534392","display_name":"University of North Texas","ror":"https://ror.org/00v97ad02","country_code":"US","type":"education","lineage":["https://openalex.org/I123534392"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Qing Yang","raw_affiliation_strings":["University of North Texas,Dept. of Computer Science and Engineering"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Texas,Dept. of Computer Science and Engineering","institution_ids":["https://openalex.org/I123534392"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100764456","display_name":"Yan Huang","orcid":"https://orcid.org/0000-0002-0575-0156"},"institutions":[{"id":"https://openalex.org/I123534392","display_name":"University of North Texas","ror":"https://ror.org/00v97ad02","country_code":"US","type":"education","lineage":["https://openalex.org/I123534392"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yan Huang","raw_affiliation_strings":["University of North Texas,Dept. of Computer Science and Engineering"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Texas,Dept. of Computer Science and Engineering","institution_ids":["https://openalex.org/I123534392"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101979289","display_name":"Dongfang Liu","orcid":"https://orcid.org/0000-0001-6995-4775"},"institutions":[{"id":"https://openalex.org/I155173764","display_name":"Rochester Institute of Technology","ror":"https://ror.org/00v4yb702","country_code":"US","type":"education","lineage":["https://openalex.org/I155173764"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dongfang Liu","raw_affiliation_strings":["Rochester Institute of Technology,Dept. of Engineering"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Rochester Institute of Technology,Dept. of Engineering","institution_ids":["https://openalex.org/I155173764"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047220188","display_name":"Heng Fan","orcid":"https://orcid.org/0000-0002-7033-3690"},"institutions":[{"id":"https://openalex.org/I123534392","display_name":"University of North Texas","ror":"https://ror.org/00v97ad02","country_code":"US","type":"education","lineage":["https://openalex.org/I123534392"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Heng Fan","raw_affiliation_strings":["University of North Texas,Dept. of Computer Science and Engineering"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of North Texas,Dept. of Computer Science and Engineering","institution_ids":["https://openalex.org/I123534392"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":7.3312,"has_fulltext":false,"cited_by_count":24,"citation_normalized_percentile":{"value":0.97599906,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"14196","last_page":"14203"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.8989999890327454,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.8989999890327454,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.7822999954223633,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.7588000297546387,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7822355031967163},{"id":"https://openalex.org/keywords/dual","display_name":"Dual (grammatical number)","score":0.5489296913146973},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5386495590209961},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5300830602645874},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4476100206375122},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.05792680382728577}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7822355031967163},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.5489296913146973},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5386495590209961},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5300830602645874},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4476100206375122},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.05792680382728577},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros58592.2024.10801872","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10801872","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":63,"referenced_works":["https://openalex.org/W20683899","https://openalex.org/W125693051","https://openalex.org/W1903029394","https://openalex.org/W1923184257","https://openalex.org/W1966025376","https://openalex.org/W1976409045","https://openalex.org/W1982075130","https://openalex.org/W1994922096","https://openalex.org/W2039298799","https://openalex.org/W2194775991","https://openalex.org/W2774839435","https://openalex.org/W2887486131","https://openalex.org/W2921749009","https://openalex.org/W2939217524","https://openalex.org/W2945809413","https://openalex.org/W2963529609","https://openalex.org/W2963543249","https://openalex.org/W2963868681","https://openalex.org/W2971014764","https://openalex.org/W2995936506","https://openalex.org/W3015871565","https://openalex.org/W3034320133","https://openalex.org/W3035687312","https://openalex.org/W3039479109","https://openalex.org/W3091001089","https://openalex.org/W3097053213","https://openalex.org/W3106587394","https://openalex.org/W3108601100","https://openalex.org/W3108608656","https://openalex.org/W3120875261","https://openalex.org/W3131500599","https://openalex.org/W3166016280","https://openalex.org/W3174770825","https://openalex.org/W3194841206","https://openalex.org/W3198062544","https://openalex.org/W4200635035","https://openalex.org/W4205991051","https://openalex.org/W4225487034","https://openalex.org/W4304098539","https://openalex.org/W4312242472","https://openalex.org/W4312372834","https://openalex.org/W4312651322","https://openalex.org/W4312685069","https://openalex.org/W4313142416","https://openalex.org/W4319879007","https://openalex.org/W4386065698","https://openalex.org/W4386071619","https://openalex.org/W4386071848","https://openalex.org/W4386075647","https://openalex.org/W4386179772","https://openalex.org/W4386275800","https://openalex.org/W4390873881","https://openalex.org/W6765983947","https://openalex.org/W6779094306","https://openalex.org/W6784333009","https://openalex.org/W6796581206","https://openalex.org/W6797399245","https://openalex.org/W6798837711","https://openalex.org/W6809808896","https://openalex.org/W6838701581","https://openalex.org/W6842407414","https://openalex.org/W6856738047","https://openalex.org/W6857058839"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Multimodal":[0],"(e.g.,":[1,15,71],"RGB-Depth/RGB-Thermal)":[2],"fusion":[3,31,188],"has":[4],"shown":[5],"great":[6],"potential":[7],"for":[8,33,68,158,185],"improving":[9],"semantic":[10,36,73,90,161,214],"segmentation":[11,215,232],"in":[12,47,123,154],"complex":[13,209],"scenes":[14],"indoor/low-light":[16],"conditions).":[17],"Existing":[18],"approaches":[19,210],"often":[20],"fully":[21],"fine-tune":[22],"a":[23,28,58,83,124,172,192,205],"dual-branch":[24],"encoder-decoder":[25],"framework":[26],"with":[27,207],"complicated":[29,240],"feature":[30,48,111,187],"strategy":[32],"achieving":[34],"multimodal":[35,70,89,105,110,139,152,160,186,231],"segmentation,":[37,91],"which":[38],"is":[39,79,128,203,225],"training-costly":[40],"due":[41],"to":[42,80,88,116,132,135,229],"the":[43,118,137,145,155,165,179],"massive":[44],"parameter":[45,93,219],"updates":[46],"extraction":[49],"and":[50,109,127,167,189,227],"fusion.":[51],"To":[52],"address":[53],"this":[54,96],"issue,":[55],"we":[56,98,222],"propose":[57],"surprisingly":[59],"simple":[60,193],"yet":[61],"effective":[62],"dual-prompt":[63],"learning":[64,102],"network":[65],"(dubbed":[66],"DPLNet)":[67],"training-efficient":[69],"RGBD/T)":[72],"segmentation.":[74,162],"The":[75,242],"core":[76],"of":[77,178],"DPLNet":[78,197,224,237],"directly":[81],"adapt":[82],"frozen":[84,146,156],"pre-trained":[85,180],"RGB":[86],"model":[87],"reducing":[92],"updates.":[94],"For":[95],"purpose,":[97],"present":[99],"two":[100],"prompt":[101,106],"modules,":[103],"comprising":[104],"generator":[107],"(MPG)":[108],"adapter":[112],"(MFA).":[113],"MPG":[114,166],"works":[115],"fuse":[117],"features":[119,153],"from":[120,130],"different":[121],"modalities":[122],"compact":[125],"manner":[126],"inserted":[129],"shallow":[131],"deep":[133],"stages":[134],"generate":[136],"multi-level":[138],"prompts":[140],"that":[141],"are":[142,169,183],"injected":[143],"into":[144],"backbone,":[147],"while":[148,217],"MFA":[149,168],"adapts":[150],"prompted":[151],"backbone":[157,181],"better":[159],"Since":[163],"both":[164],"lightweight,":[170],"only":[171],"few":[173],"trainable":[174],"parameters":[175],"(3.88M,":[176],"4.4%":[177],"parameters)":[182],"introduced":[184],"learning.":[190],"Using":[191],"decoder":[194],"(3.27M":[195],"parameters),":[196],"achieves":[198],"new":[199],"state-of-the-art":[200],"performance":[201],"or":[202],"on":[204,211],"par":[206],"other":[208,230],"four":[212],"RGB-D/T":[213],"datasets":[216],"satisfying":[218],"efficiency.":[220],"Moreover,":[221],"show":[223],"general":[226],"applicable":[228],"tasks.":[233],"Without":[234],"special":[235],"design,":[236],"outperforms":[238],"many":[239],"models.":[241],"source":[243],"code":[244],"can":[245],"be":[246],"found":[247],"at":[248],"https://github.com/ShaohuaDong2021/DPLNet.":[249]},"counts_by_year":[{"year":2026,"cited_by_count":7},{"year":2025,"cited_by_count":15},{"year":2024,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
