{"id":"https://openalex.org/W7134041463","doi":"https://doi.org/10.1016/j.patcog.2026.113429","title":"P3D: Plug-and-play prompt-driven framework for RGB-thermal semantic segmentation","display_name":"P3D: Plug-and-play prompt-driven framework for RGB-thermal semantic segmentation","publication_year":2026,"publication_date":"2026-03-06","ids":{"openalex":"https://openalex.org/W7134041463","doi":"https://doi.org/10.1016/j.patcog.2026.113429"},"language":"en","primary_location":{"id":"doi:10.1016/j.patcog.2026.113429","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.patcog.2026.113429","pdf_url":null,"source":{"id":"https://openalex.org/S414566","display_name":"Pattern Recognition","issn_l":"0031-3203","issn":["0031-3203","1873-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Pattern Recognition","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1016/j.patcog.2026.113429","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Yongqi Sun","orcid":"https://orcid.org/0009-0000-5104-8184"},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongqi Sun","raw_affiliation_strings":["Information Engineering University, Zhengzhou, 450001, China"],"raw_orcid":"https://orcid.org/0009-0000-5104-8184","affiliations":[{"raw_affiliation_string":"Information Engineering University, Zhengzhou, 450001, China","institution_ids":["https://openalex.org/I169689159"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020207163","display_name":"Chenguang Dai","orcid":"https://orcid.org/0000-0003-4681-3851"},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chenguang Dai","raw_affiliation_strings":["Information Engineering University, Zhengzhou, 450001, China"],"raw_orcid":"https://orcid.org/0000-0003-4681-3851","affiliations":[{"raw_affiliation_string":"Information Engineering University, Zhengzhou, 450001, China","institution_ids":["https://openalex.org/I169689159"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122845172","display_name":"Hanyun Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hanyun Wang","raw_affiliation_strings":["Sun Yat-sen University, Shenzhen, 518107, China"],"raw_orcid":"https://orcid.org/0000-0002-8320-4230","affiliations":[{"raw_affiliation_string":"Sun Yat-sen University, Shenzhen, 518107, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058116832","display_name":"Longguang Wang","orcid":"https://orcid.org/0000-0003-0429-0263"},"institutions":[{"id":"https://openalex.org/I4210167232","display_name":"PLA Air Force Aviation University","ror":"https://ror.org/031g2ra50","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210167232"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Longguang Wang","raw_affiliation_strings":["Aviation University of Air Force, Changchun, 130022, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Aviation University of Air Force, Changchun, 130022, China","institution_ids":["https://openalex.org/I4210167232"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045714134","display_name":"W. J. Li","orcid":null},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenke Li","raw_affiliation_strings":["Information Engineering University, Zhengzhou, 450001, China"],"raw_orcid":"https://orcid.org/0009-0004-7285-3026","affiliations":[{"raw_affiliation_string":"Information Engineering University, Zhengzhou, 450001, China","institution_ids":["https://openalex.org/I169689159"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000973540","display_name":"Meilin Li","orcid":"https://orcid.org/0000-0003-3732-962X"},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meilin Li","raw_affiliation_strings":["Information Engineering University, Zhengzhou, 450001, China"],"raw_orcid":"https://orcid.org/0000-0003-3732-962X","affiliations":[{"raw_affiliation_string":"Information Engineering University, Zhengzhou, 450001, China","institution_ids":["https://openalex.org/I169689159"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128244123","display_name":"Yongsheng Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongsheng Zhang","raw_affiliation_strings":["Information Engineering University, Zhengzhou, 450001, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Information Engineering University, Zhengzhou, 450001, China","institution_ids":["https://openalex.org/I169689159"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069652653","display_name":"Anzhu Yu","orcid":"https://orcid.org/0000-0002-3332-9668"},"institutions":[{"id":"https://openalex.org/I169689159","display_name":"PLA Information Engineering University","ror":"https://ror.org/00mm1qk40","country_code":"CN","type":"education","lineage":["https://openalex.org/I169689159"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Anzhu Yu","raw_affiliation_strings":["Information Engineering University, Zhengzhou, 450001, China"],"raw_orcid":"https://orcid.org/0000-0002-3332-9668","affiliations":[{"raw_affiliation_string":"Information Engineering University, Zhengzhou, 450001, China","institution_ids":["https://openalex.org/I169689159"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5020207163"],"corresponding_institution_ids":["https://openalex.org/I169689159"],"apc_list":{"value":2710,"currency":"USD","value_usd":2710},"apc_paid":{"value":2710,"currency":"USD","value_usd":2710},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.41467408,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"178","issue":null,"first_page":"113429","last_page":"113429"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.5785999894142151,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.5785999894142151,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12994","display_name":"Infrared Thermography in Medicine","score":0.09030000120401382,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.027499999850988388,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semantic-gap","display_name":"Semantic gap","score":0.7692999839782715},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6198999881744385},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6132000088691711},{"id":"https://openalex.org/keywords/semantic-mapping","display_name":"Semantic mapping","score":0.44200000166893005},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.39419999718666077},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.3828999996185303},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3675999939441681},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.36660000681877136},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.3653999865055084}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8381999731063843},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.7692999839782715},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6341000199317932},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6198999881744385},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6132000088691711},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.44200000166893005},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.39419999718666077},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.38339999318122864},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.3828999996185303},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3675999939441681},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.36660000681877136},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3653999865055084},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3562000095844269},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35589998960494995},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.3538999855518341},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.3528999984264374},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.3513000011444092},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.3458999991416931},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3418000042438507},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.31459999084472656},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.310699999332428},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.305400013923645},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.301800012588501},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.2867000102996826},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.2849000096321106},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.2750999927520752},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.26829999685287476},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.25440001487731934},{"id":"https://openalex.org/C2778712577","wikidata":"https://www.wikidata.org/wiki/Q3505966","display_name":"Retraining","level":2,"score":0.2522999942302704}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.patcog.2026.113429","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.patcog.2026.113429","pdf_url":null,"source":{"id":"https://openalex.org/S414566","display_name":"Pattern Recognition","issn_l":"0031-3203","issn":["0031-3203","1873-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Pattern Recognition","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.patcog.2026.113429","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.patcog.2026.113429","pdf_url":null,"source":{"id":"https://openalex.org/S414566","display_name":"Pattern Recognition","issn_l":"0031-3203","issn":["0031-3203","1873-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Pattern Recognition","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1439962409","display_name":null,"funder_award_id":"62301601,42271457","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4052271284","display_name":null,"funder_award_id":"42571527","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4168836438","display_name":null,"funder_award_id":"221100211000-02","funder_id":"https://openalex.org/F4320330206","funder_display_name":"Science and Technology Program of Hunan Province"},{"id":"https://openalex.org/G4301157100","display_name":null,"funder_award_id":"20250102209JC","funder_id":"https://openalex.org/F4320327282","funder_display_name":"Department of Science and Technology of Jilin Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320327282","display_name":"Department of Science and Technology of Jilin Province","ror":null},{"id":"https://openalex.org/F4320330206","display_name":"Science and Technology Program of Hunan Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W2896014703","https://openalex.org/W2910187721","https://openalex.org/W2921749009","https://openalex.org/W3033020497","https://openalex.org/W3198062544","https://openalex.org/W4285290430","https://openalex.org/W4303946404","https://openalex.org/W4381300351","https://openalex.org/W4382567565","https://openalex.org/W4386179772","https://openalex.org/W4386275800","https://openalex.org/W4390489106","https://openalex.org/W4394863092","https://openalex.org/W4398224523","https://openalex.org/W4402043206","https://openalex.org/W4403828029","https://openalex.org/W4406786999","https://openalex.org/W4410539708","https://openalex.org/W4414196945","https://openalex.org/W4416749171"],"related_works":[],"abstract_inverted_index":{"\u2022":[0,10,19],"A":[1,20],"plug-and-play":[2,120,317],"prompt-driven":[3],"framework":[4,123],"for":[5,14,28,38,109,137,175,251],"RGB-thermal":[6,34,99],"image":[7,173,180],"semantic":[8,31,100,216],"segmentation.":[9],"LoRA-based":[11],"fine-tuning":[12],"strategy":[13,150],"SAM":[15,194],"series":[16,195],"model":[17,52,85],"integration.":[18],"model-agnostic":[21,148,227],"encoder":[22,174,208],"to":[23,54,68,106,184,242],"generate":[24],"statistical":[25],"distributed":[26],"prompts":[27,214,225,250],"training.":[29],"The":[30],"segmentation":[32,72,101],"of":[33,274,315],"images":[35,248],"is":[36,127,144,182,209,240],"critical":[37],"applications":[39],"with":[40,79,146,158,230],"low-light":[41],"conditions.":[42],"Existing":[43],"works":[44],"primarily":[45],"focus":[46],"on":[47,259],"feature":[48],"fusion":[49],"strategies":[50],"and":[51,71,91,98,155,178,189,205,228,249],"design":[53],"enhance":[55],"performance.":[56],"While":[57],"Visual":[58],"Foundation":[59],"Models":[60],"(VFMs)":[61],"have":[62],"been":[63],"introduced":[64],"in":[65,116],"previous":[66],"studies":[67],"improve":[69],"generalization":[70],"accuracy,":[73],"they":[74],"suffer":[75],"from":[76,246],"poor":[77],"compatibility":[78],"other":[80],"models":[81,196,276],"thus":[82],"requiring":[83,163],"full":[84],"retraining.":[86,164],"Additionally,":[87],"the":[88,176,186,219,223,244,252,272,312],"domain":[89,187],"gap":[90,93,188,191],"modality":[92,190],"between":[94],"VFM":[95,107],"pre-training":[96],"datasets":[97,102],"pose":[103],"significant":[104,303],"challenges":[105],"adaptation":[108],"downstream":[110],"tasks.":[111],"To":[112],"address":[113],"these":[114,308],"issues,":[115],"this":[117],"paper":[118],"a":[119,147,166,201,234],"prompt":[121,203],"driven":[122],"P":[124,141,266,294],"3":[125,142,267,295],"D":[126,143,268,296],"proposed.":[128,210],"Unlike":[129],"existing":[130,160,231,275,298],"VFM-based":[131],"methods":[132,161,283],"that":[133,151,265],"require":[134],"complete":[135],"retraining":[136,307],"each":[138],"specific":[139],"architecture,":[140],"designed":[145],"training":[149,154,220],"enables":[152],"one-time":[153],"seamless":[156],"integration":[157],"various":[159],"without":[162,306],"First,":[165],"dual-branch":[167],"LoRA":[168],"(Low-Rank":[169],"Adaptation)":[170],"fine-tuned":[171],"(DBLF)":[172],"RGB":[177],"thermal":[179],"branches":[181],"proposed":[183],"narrow":[185],"when":[192],"incorporating":[193],"into":[197,297],"our":[198,316],"task.":[199],"Second,":[200],"unified":[202],"generation":[204],"representation":[206],"(UPGR)":[207],"It":[211],"generates":[212],"diverse":[213],"using":[215],"labels":[217],"during":[218],"stage,":[221],"ensuring":[222],"generated":[224],"are":[226,257],"compatible":[229],"methods.":[232],"Finally,":[233],"cross-modality":[235],"spatial-channel":[236],"attention":[237],"(CM-SCA)":[238],"decoder":[239],"developed":[241],"fuse":[243],"embeddings":[245],"two-modality":[247],"final":[253],"prediction.":[254],"Extensive":[255],"experiments":[256],"conducted":[258],"three":[260],"popular":[261],"benchmarks.":[262],"Results":[263],"demonstrate":[264],"not":[269],"only":[270],"improves":[271],"performance":[273,304],"but":[277],"also":[278],"outperforms":[279],"current":[280],"state-of-the-art":[281],"(SOTA)":[282],"leveraging":[284],"<":[285],"1%":[286],"trainable":[287],"parameters.":[288],"More":[289],"importantly,":[290],"by":[291],"simply":[292],"plugging":[293],"methods,":[299],"we":[300],"consistently":[301],"achieve":[302],"improvements":[305],"base":[309],"models,":[310],"demonstrating":[311],"practical":[313],"value":[314],"design.":[318]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-07T00:00:00"}
