{"id":"https://openalex.org/W7147636128","doi":"https://doi.org/10.48550/arxiv.2603.28414","title":"Unified Restoration-Perception Learning: Maritime Infrared-Visible Image Fusion and Segmentation","display_name":"Unified Restoration-Perception Learning: Maritime Infrared-Visible Image Fusion and Segmentation","publication_year":2026,"publication_date":"2026-03-30","ids":{"openalex":"https://openalex.org/W7147636128","doi":"https://doi.org/10.48550/arxiv.2603.28414"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.28414","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.28414","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.28414","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132563986","display_name":"Weichao Cai","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Cai, Weichao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132570368","display_name":"Weiliang Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Weiliang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132684077","display_name":"Biao Xue","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xue, Biao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132702676","display_name":"Chao Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Chao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132593856","display_name":"Fei Yuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuan, Fei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132553572","display_name":"Bob Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Bob","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5132563986"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9032999873161316,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9032999873161316,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.045099999755620956,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.021199999377131462,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7451000213623047},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6370999813079834},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5253000259399414},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.446399986743927},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.44510000944137573},{"id":"https://openalex.org/keywords/image-fusion","display_name":"Image fusion","score":0.42160001397132874},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.3578999936580658}],"concepts":[{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7451000213623047},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6937000155448914},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6370999813079834},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5971999764442444},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5253000259399414},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.446399986743927},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.44510000944137573},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.42890000343322754},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.42160001397132874},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3578999936580658},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.32710000872612},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.30250000953674316},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.2985000014305115},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.27140000462532043},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.2648000121116638},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.25529998540878296},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2542000114917755}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.28414","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.28414","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.28414","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.28414","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.6854701042175293,"id":"https://metadata.un.org/sdg/14","display_name":"Life below water"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Marine":[0],"scene":[1],"understanding":[2],"and":[3,12,20,39,61,107,129,148,160,185],"segmentation":[4,131,180],"plays":[5],"a":[6,114,133,139,151,161],"vital":[7],"role":[8],"in":[9,23,84],"maritime":[10,24,102,190],"monitoring":[11],"navigation":[13],"safety.":[14],"However,":[15],"prevalent":[16],"factors":[17],"like":[18],"fog":[19],"strong":[21],"reflections":[22],"environments":[25],"cause":[26],"severe":[27],"image":[28,125],"degradation,":[29],"significantly":[30,182],"compromising":[31],"the":[32,78,91,175],"stability":[33],"of":[34,81],"semantic":[35,62,130],"perception.":[36],"Existing":[37],"restoration":[38],"enhancement":[40],"methods":[41],"typically":[42],"target":[43],"specific":[44],"degradations":[45,83],"or":[46],"focus":[47],"solely":[48],"on":[49,171],"visual":[50],"quality,":[51],"lacking":[52],"end-to-end":[53],"collaborative":[54],"mechanisms":[55],"that":[56,174],"simultaneously":[57],"improve":[58],"structural":[59,149],"recovery":[60],"effectiveness.":[63],"Moreover,":[64],"publicly":[65],"available":[66],"infrared-visible":[67],"datasets":[68],"are":[69],"predominantly":[70],"collected":[71],"from":[72],"urban":[73],"scenes,":[74],"failing":[75],"to":[76,99,122],"capture":[77],"authentic":[79],"characteristics":[80],"coupled":[82],"marine":[85],"environments.":[86],"To":[87],"address":[88],"these":[89],"challenges,":[90],"Infrared-Visible":[92],"Maritime":[93],"Ship":[94],"Dataset":[95],"(IVMSD)":[96],"is":[97,120],"proposed":[98,121,176],"cover":[100],"various":[101],"scenarios":[103],"under":[104,188],"diverse":[105],"weather":[106],"illumination":[108],"conditions.":[109,191],"Building":[110],"upon":[111],"this":[112],"dataset,":[113],"Multi-task":[115],"Complementary":[116,142],"Learning":[117],"Framework":[118],"(MCLF)":[119],"collaboratively":[123],"perform":[124],"restoration,":[126],"multimodal":[127],"fusion,":[128],"within":[132],"unified":[134],"architecture.":[135],"The":[136],"framework":[137],"includes":[138],"Frequency-Spatial":[140],"Enhancement":[141],"(FSEC)":[143],"module":[144,156],"for":[145,157,166],"degradation":[146],"suppression":[147],"enhancement,":[150],"Semantic-Visual":[152],"Consistency":[153],"Attention":[154],"(SVCA)":[155],"semantic-consistent":[158],"guidance,":[159],"cross-modality":[162],"guided":[163],"attention":[164],"mechanism":[165],"selective":[167],"fusion.":[168],"Experimental":[169],"results":[170],"IVMSD":[172],"demonstrate":[173],"method":[177],"achieves":[178],"state-of-the-art":[179],"performance,":[181],"enhancing":[183],"robustness":[184],"perceptual":[186],"quality":[187],"complex":[189]},"counts_by_year":[],"updated_date":"2026-04-02T13:53:19.096889","created_date":"2026-04-02T00:00:00"}
