{"id":"https://openalex.org/W7147625238","doi":"https://doi.org/10.48550/arxiv.2603.27558","title":"Learning to See through Illumination Extremes with Event Streaming in Multimodal Large Language Models","display_name":"Learning to See through Illumination Extremes with Event Streaming in Multimodal Large Language Models","publication_year":2026,"publication_date":"2026-03-29","ids":{"openalex":"https://openalex.org/W7147625238","doi":"https://doi.org/10.48550/arxiv.2603.27558"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.27558","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27558","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.27558","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132678397","display_name":"Baoheng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Baoheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132626406","display_name":"Jiahui Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Jiahui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132602316","display_name":"Gui Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Gui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132628519","display_name":"Weizhou Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Weizhou","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132595987","display_name":"Yixuan Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Yixuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132671378","display_name":"Jun Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Jun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029530832","display_name":"Yingxian Chen","orcid":"https://orcid.org/0000-0001-9171-7936"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yingxian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017408024","display_name":"Wilton Fok","orcid":"https://orcid.org/0000-0003-4448-7300"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fok, Wilton W. T.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132608466","display_name":"Xiaojuan Qi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qi, Xiaojuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5123484012","display_name":"Hayden Kwok-Hay So","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"So, Hayden Kwok-Hay","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5132678397"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9311000108718872,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9311000108718872,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.01600000075995922,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.009600000455975533,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.6665999889373779},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.6122000217437744},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.59579998254776},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5667999982833862},{"id":"https://openalex.org/keywords/extreme-learning-machine","display_name":"Extreme learning machine","score":0.5029000043869019},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.49950000643730164},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.41769999265670776},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.38940000534057617}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7440000176429749},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.6665999889373779},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6654999852180481},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.6122000217437744},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.59579998254776},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5667999982833862},{"id":"https://openalex.org/C2780150128","wikidata":"https://www.wikidata.org/wiki/Q21948731","display_name":"Extreme learning machine","level":3,"score":0.5029000043869019},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.49950000643730164},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.41769999265670776},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.38940000534057617},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3756999969482422},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.37299999594688416},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.35659998655319214},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3343999981880188},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3325999975204468},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.31119999289512634},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.30000001192092896},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.28850001096725464},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.2815000116825104},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.272599995136261},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.27149999141693115},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.2685999870300293},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.265500009059906},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.2628999948501587},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2522999942302704}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.27558","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27558","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.27558","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27558","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7256161570549011,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multimodal":[0],"Large":[1],"Language":[2],"Models":[3],"(MLLMs)":[4],"perform":[5],"strong":[6],"vision-language":[7],"reasoning":[8,35,160],"under":[9,134,161],"standard":[10],"conditions":[11],"but":[12],"fail":[13],"in":[14,85,93,155],"extreme":[15,94,135],"illumination,":[16],"where":[17],"RGB":[18,42],"inputs":[19],"lose":[20],"irrevocable":[21],"structure":[22],"and":[23,66,72,117,131,145,159],"semantics.":[24],"We":[25,96],"propose":[26],"Event-MLLM,":[27],"an":[28,50,73,125],"event-enhanced":[29],"model":[30],"that":[31,62,77,139],"performs":[32],"all-light":[33],"visual":[34],"by":[36],"dynamically":[37],"fusing":[38],"event":[39],"streams":[40],"with":[41,81,105],"frames.":[43],"Two":[44],"key":[45],"components":[46],"drive":[47],"our":[48],"approach:":[49],"Illumination":[51,74],"Indicator":[52],"-":[53,71,122],"a":[54,59,149],"learnable":[55],"signal":[56],"derived":[57],"from":[58],"DINOv2":[60],"branch":[61],"represents":[63],"exposure":[64],"degradation":[65],"adaptively":[67],"modulates":[68],"event-RGB":[69,107],"fusion":[70],"Correction":[75],"Loss":[76],"aligns":[78],"fused":[79],"features":[80],"non-degraded":[82],"(normal-light)":[83],"semantics":[84],"the":[86,98,153],"latent":[87],"space,":[88],"compensating":[89],"for":[90,103,128],"information":[91],"lost":[92],"lighting.":[95,136],"curate":[97],"first":[99],"multi-illumination":[100],"event-instruction":[101],"corpus":[102],"MLLMs,":[104],"2,241":[106],"samples":[108],"(around":[109],"6":[110],"QA":[111],"pairs":[112],"each)":[113],"across":[114],"diverse":[115],"scenes":[116],"17":[118],"brightness":[119],"rates":[120],"(0.05x":[121],"20x),":[123],"plus":[124],"instruct-following":[126],"benchmark":[127],"reasoning,":[129],"counting,":[130],"fine-grained":[132],"recognition":[133],"Experiments":[137],"show":[138],"Event-MLLM":[140],"markedly":[141],"outperforms":[142],"general-purpose,":[143],"illumination-adaptive,":[144],"event-only":[146],"baselines,":[147],"setting":[148],"new":[150],"state":[151],"of":[152],"art":[154],"robust":[156],"multimodal":[157],"perception":[158],"challenging":[162],"illumination.":[163]},"counts_by_year":[],"updated_date":"2026-04-02T13:53:19.096889","created_date":"2026-04-02T00:00:00"}
