{"id":"https://openalex.org/W7138346265","doi":"https://doi.org/10.48550/arxiv.2603.13941","title":"Bidirectional Cross-Attention Fusion of High-Res RGB and Low-Res HSI for Multimodal Automated Waste Sorting","display_name":"Bidirectional Cross-Attention Fusion of High-Res RGB and Low-Res HSI for Multimodal Automated Waste Sorting","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138346265","doi":"https://doi.org/10.48550/arxiv.2603.13941"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.13941","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.13941","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.13941","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123617378","display_name":"Jonas V. Funk","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Funk, Jonas V.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092740240","display_name":"Lukas Roming","orcid":"https://orcid.org/0009-0006-1330-3117"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Roming, Lukas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129663396","display_name":"Andreas Michel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Michel, Andreas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123603752","display_name":"Paul B\u00e4cker","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"B\u00e4cker, Paul","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129648393","display_name":"Georg Maier","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Maier, Georg","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025271723","display_name":"Thomas L\u00e4ngle","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"L\u00e4ngle, Thomas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129695509","display_name":"Markus Klute","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Klute, Markus","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5123617378"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.32850000262260437,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.32850000262260437,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.12150000035762787,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.10830000042915344,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.7936999797821045},{"id":"https://openalex.org/keywords/hyperspectral-imaging","display_name":"Hyperspectral imaging","score":0.6725000143051147},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5846999883651733},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.41990000009536743},{"id":"https://openalex.org/keywords/sorting","display_name":"Sorting","score":0.4056999981403351},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4020000100135803},{"id":"https://openalex.org/keywords/spectral-imaging","display_name":"Spectral imaging","score":0.35989999771118164},{"id":"https://openalex.org/keywords/counterfeit","display_name":"Counterfeit","score":0.3598000109195709},{"id":"https://openalex.org/keywords/conveyor-belt","display_name":"Conveyor belt","score":0.358599990606308}],"concepts":[{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.7936999797821045},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6858000159263611},{"id":"https://openalex.org/C159078339","wikidata":"https://www.wikidata.org/wiki/Q959005","display_name":"Hyperspectral imaging","level":2,"score":0.6725000143051147},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6089000105857849},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5846999883651733},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.546999990940094},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.41990000009536743},{"id":"https://openalex.org/C111696304","wikidata":"https://www.wikidata.org/wiki/Q2303697","display_name":"Sorting","level":2,"score":0.4056999981403351},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4020000100135803},{"id":"https://openalex.org/C3232514","wikidata":"https://www.wikidata.org/wiki/Q7575196","display_name":"Spectral imaging","level":2,"score":0.35989999771118164},{"id":"https://openalex.org/C2779356469","wikidata":"https://www.wikidata.org/wiki/Q502918","display_name":"Counterfeit","level":2,"score":0.3598000109195709},{"id":"https://openalex.org/C2777709985","wikidata":"https://www.wikidata.org/wiki/Q770135","display_name":"Conveyor belt","level":2,"score":0.358599990606308},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.3447999954223633},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.3386000096797943},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.33570000529289246},{"id":"https://openalex.org/C205372480","wikidata":"https://www.wikidata.org/wiki/Q210521","display_name":"Image resolution","level":2,"score":0.3353999853134155},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.3237000107765198},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.3068000078201294},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.3052000105381012},{"id":"https://openalex.org/C136536468","wikidata":"https://www.wikidata.org/wiki/Q1225894","display_name":"Undersampling","level":2,"score":0.30320000648498535},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2870999872684479},{"id":"https://openalex.org/C176641082","wikidata":"https://www.wikidata.org/wiki/Q2446767","display_name":"Spectral signature","level":2,"score":0.27219998836517334},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.26499998569488525},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.26339998841285706},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2599000036716461}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.13941","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.13941","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.13941","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.13941","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.4019375145435333}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Growing":[0],"waste":[1,13,73],"streams":[2],"and":[3,27,125,148,164,189,224,237],"the":[4,52,149,175],"transition":[5],"to":[6,82,166],"a":[7,119,198],"circular":[8],"economy":[9],"require":[10],"efficient":[11],"automated":[12],"sorting.":[14],"In":[15],"industrial":[16,200],"settings,":[17],"materials":[18,47],"move":[19],"on":[20,208],"fast":[21],"conveyor":[22],"belts,":[23],"where":[24],"reliable":[25],"identification":[26],"ejection":[28],"demand":[29],"pixel-accurate":[30],"segmentation.":[31],"RGB":[32,96,124,145,168,204],"imaging":[33,56],"delivers":[34],"high-resolution":[35,95],"spatial":[36,68],"detail,":[37],"which":[38,93],"is":[39,162],"essential":[40],"for":[41,123,217,227],"accurate":[42],"segmentation,":[43],"but":[44],"it":[45],"confuses":[46],"that":[48,61,78,130],"look":[49],"similar":[50],"in":[51],"visible":[53],"spectrum.":[54],"Hyperspectral":[55],"(HSI)":[57],"provides":[58],"spectral":[59,112,132,138,153],"signatures":[60],"separate":[62],"such":[63],"materials,":[64],"yet":[65],"its":[66],"lower":[67],"resolution":[69,147],"limits":[70],"detail.":[71],"Effective":[72],"sorting":[74],"therefore":[75],"needs":[76],"methods":[77],"fuse":[79],"both":[80],"modalities":[81],"exploit":[83],"their":[84,101],"complementary":[85],"strengths.":[86],"We":[87,140,195],"present":[88],"Bidirectional":[89],"Cross-Attention":[90],"Fusion":[91],"(BCAF),":[92],"aligns":[94],"with":[97,137,169],"low-resolution":[98],"HSI":[99,152],"at":[100,186,192,243],"native":[102],"grids":[103],"via":[104],"localized,":[105],"bidirectional":[106],"cross-attention,":[107],"avoiding":[108],"pre-upsampling":[109],"or":[110],"early":[111],"collapse.":[113],"BCAF":[114,161,179,213],"uses":[115],"two":[116],"independent":[117],"backbones:":[118],"standard":[120],"Swin":[121,128],"Transformer":[122],"an":[126],"HSI-adapted":[127],"backbone":[129],"preserves":[131],"structure":[133],"through":[134],"3D":[135],"tokenization":[136],"self-attention.":[139],"also":[141],"analyze":[142],"trade-offs":[143],"between":[144],"input":[146],"number":[150],"of":[151,183],"slices.":[154],"Although":[155],"our":[156],"evaluation":[157],"targets":[158],"RGB-HSI":[159],"fusion,":[160],"modality-agnostic":[163],"applies":[165],"co-registered":[167],"lower-resolution,":[170],"high-channel":[171],"auxiliary":[172],"sensors.":[173],"On":[174,210],"benchmark":[176],"SpectralWaste":[177],"dataset,":[178,212],"achieves":[180],"state-of-the-art":[181],"performance":[182],"76.4%":[184],"mIoU":[185,191,216,226],"31":[187],"images/s":[188],"75.4%":[190],"55":[193],"images/s.":[194],"further":[196],"evaluate":[197],"novel":[199],"dataset:":[201],"K3I-Cycling":[202],"(first":[203],"subset":[205],"already":[206],"released":[207],"Fordatis).":[209],"this":[211],"reaches":[214],"62.3%":[215],"material":[218],"segmentation":[219,229],"(paper,":[220],"metal,":[221],"plastic,":[222],"etc.)":[223],"66.2%":[225],"plastic-type":[228],"(PET,":[230],"PP,":[231],"HDPE,":[232],"LDPE,":[233],"PS,":[234],"etc.).":[235],"Code":[236],"model":[238],"checkpoints":[239],"are":[240],"publicly":[241],"available":[242],"https://github.com/jonasvilhofunk/BCAF_2026":[244],".":[245]},"counts_by_year":[],"updated_date":"2026-04-15T05:59:14.812645","created_date":"2026-03-18T00:00:00"}
