{"id":"https://openalex.org/W7154345416","doi":"https://doi.org/10.48550/arxiv.2604.11140","title":"Sparse Hypergraph-Enhanced Frame-Event Object Detection with Fine-Grained MoE","display_name":"Sparse Hypergraph-Enhanced Frame-Event Object Detection with Fine-Grained MoE","publication_year":2026,"publication_date":"2026-04-13","ids":{"openalex":"https://openalex.org/W7154345416","doi":"https://doi.org/10.48550/arxiv.2604.11140"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.11140","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.11140","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.11140","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133555257","display_name":"Wei Bao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bao, Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101778577","display_name":"Yuehan Wang","orcid":"https://orcid.org/0000-0001-8651-4720"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yuehan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101817614","display_name":"Tao Zhou","orcid":"https://orcid.org/0000-0001-8195-8998"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Tianhang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133584225","display_name":"Siqi Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Siqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133619999","display_name":"Yue Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Yue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.4902999997138977,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.4902999997138977,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.10509999841451645,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.06279999762773514,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hypergraph","display_name":"Hypergraph","score":0.6069999933242798},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5360999703407288},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.5220000147819519},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.5181999802589417},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.46560001373291016},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4406000077724457},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.420199990272522},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.3797000050544739}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7886999845504761},{"id":"https://openalex.org/C2781221856","wikidata":"https://www.wikidata.org/wiki/Q840247","display_name":"Hypergraph","level":2,"score":0.6069999933242798},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.559499979019165},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5360999703407288},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.5220000147819519},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.5181999802589417},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.46560001373291016},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4406000077724457},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.42089998722076416},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.420199990272522},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.3797000050544739},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.36390000581741333},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.35429999232292175},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.349700003862381},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.34279999136924744},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.34209999442100525},{"id":"https://openalex.org/C72634772","wikidata":"https://www.wikidata.org/wiki/Q386824","display_name":"Data integration","level":2,"score":0.30070000886917114},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.29809999465942383},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.2971000075340271},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2948000133037567},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2678000032901764},{"id":"https://openalex.org/C7545210","wikidata":"https://www.wikidata.org/wiki/Q838123","display_name":"Data redundancy","level":2,"score":0.25429999828338623},{"id":"https://openalex.org/C89198739","wikidata":"https://www.wikidata.org/wiki/Q3079880","display_name":"Data stream mining","level":2,"score":0.25369998812675476}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.11140","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.11140","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.11140","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.11140","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Integrating":[0],"frame-based":[1],"RGB":[2,99],"cameras":[3],"with":[4,160],"event":[5,74,101],"streams":[6,75],"offers":[7],"a":[8,45,115,148,161,191,200],"promising":[9],"solution":[10],"for":[11,140,204],"robust":[12],"object":[13,141],"detection":[14,49],"under":[15],"challenging":[16],"dynamic":[17],"conditions.":[18],"However,":[19],"the":[20,70,105,125,177],"inherent":[21,71],"heterogeneity":[22],"and":[23,47,100,145,156,164,171],"data":[24,102],"redundancy":[25],"of":[26,73,109,118,129],"these":[27],"modalities":[28],"often":[29],"lead":[30],"to":[31,76,123,153],"prohibitive":[32],"computational":[33],"overhead":[34],"or":[35],"suboptimal":[36],"feature":[37,173],"fusion.":[38],"In":[39],"this":[40],"paper,":[41],"we":[42,61,113],"propose":[43],"Hyper-FEOD,":[44],"high-performance":[46],"efficient":[48],"framework,":[50],"which":[51,68],"synergistically":[52],"optimizes":[53],"multi-modal":[54],"interaction":[55],"through":[56],"two":[57],"core":[58],"components.":[59],"First,":[60],"introduce":[62],"Sparse":[63],"Hypergraph-enhanced":[64],"Cross-Modal":[65],"Fusion":[66],"(S-HCF),":[67],"leverages":[69],"sparsity":[72],"construct":[77],"an":[78],"event-guided":[79],"activity":[80],"map.":[81],"By":[82],"performing":[83],"high-order":[84],"hypergraph":[85,110,137],"modeling":[86],"exclusively":[87],"on":[88,183],"selected":[89],"motion-critical":[90],"sparse":[91],"tokens,":[92],"S-HCF":[93],"captures":[94],"complex":[95],"non-local":[96],"dependencies":[97],"between":[98],"while":[103,198],"overcoming":[104],"traditional":[106],"complexity":[107],"bottlenecks":[108],"computation.":[111],"Second,":[112],"design":[114],"Fine-Grained":[116],"Mixture":[117],"Experts":[119],"(FG-MoE)":[120],"Enhancement":[121],"module":[122,134],"address":[124],"diverse":[126],"semantic":[127],"requirements":[128],"different":[130],"image":[131],"regions.":[132],"This":[133],"employs":[135],"specialized":[136],"experts":[138],"tailored":[139],"boundaries,":[142],"internal":[143],"textures,":[144],"backgrounds,":[146],"utilizing":[147],"pixel-level":[149],"spatial":[150],"gating":[151],"mechanism":[152],"adaptively":[154],"route":[155],"enhance":[157],"features.":[158],"Combined":[159],"load-balancing":[162],"loss":[163],"zero-initialization":[165],"strategy,":[166],"FG-MoE":[167],"ensures":[168],"stable":[169],"training":[170],"precise":[172],"refinement":[174],"without":[175],"disrupting":[176],"pre-trained":[178],"backbone's":[179],"distribution.":[180],"Experimental":[181],"results":[182],"mainstream":[184],"RGB-Event":[185],"benchmarks":[186],"demonstrate":[187],"that":[188],"Hyper-FEOD":[189],"achieves":[190],"superior":[192],"accuracy-efficiency":[193],"trade-off,":[194],"outperforming":[195],"state-of-the-art":[196],"methods":[197],"maintaining":[199],"lightweight":[201],"footprint":[202],"suitable":[203],"real-time":[205],"edge":[206],"deployment.":[207]},"counts_by_year":[],"updated_date":"2026-07-01T08:55:40.977307","created_date":"2026-04-15T00:00:00"}
