{"id":"https://openalex.org/W7160957487","doi":"https://doi.org/10.48550/arxiv.2605.10228","title":"FLARE: Full-Modality Long-Video Audiovisual Retrieval Benchmark with User-Simulated Queries","display_name":"FLARE: Full-Modality Long-Video Audiovisual Retrieval Benchmark with User-Simulated Queries","publication_year":2026,"publication_date":"2026-05-11","ids":{"openalex":"https://openalex.org/W7160957487","doi":"https://doi.org/10.48550/arxiv.2605.10228"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.10228","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.10228","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.10228","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120442906","display_name":"Qijie You","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"You, Qijie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135964521","display_name":"Hao Liang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135919863","display_name":"Mingrui Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Mingrui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135956653","display_name":"Bohan Zeng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zeng, Bohan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120132025","display_name":"Meiyi Qiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qiang, Meiyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136000026","display_name":"Zhenhao Wong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wong, Zhenhao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135913403","display_name":"Wentao Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Wentao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8432000279426575,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8432000279426575,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.07440000027418137,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.019899999722838402,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6523000001907349},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5627999901771545},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.555400013923645},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5205000042915344},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5110999941825867},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.4756999909877777},{"id":"https://openalex.org/keywords/data-retrieval","display_name":"Data retrieval","score":0.40709999203681946},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.3862999975681305}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8468999862670898},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6712999939918518},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6523000001907349},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5627999901771545},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.555400013923645},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5205000042915344},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5110999941825867},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.4756999909877777},{"id":"https://openalex.org/C551230270","wikidata":"https://www.wikidata.org/wiki/Q4368942","display_name":"Data retrieval","level":2,"score":0.40709999203681946},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.3862999975681305},{"id":"https://openalex.org/C2983174267","wikidata":"https://www.wikidata.org/wiki/Q3775098","display_name":"Video retrieval","level":2,"score":0.3621000051498413},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3481999933719635},{"id":"https://openalex.org/C189391414","wikidata":"https://www.wikidata.org/wiki/Q7936579","display_name":"Visual Word","level":4,"score":0.31360000371932983},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.30079999566078186},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.29190000891685486},{"id":"https://openalex.org/C2781020372","wikidata":"https://www.wikidata.org/wiki/Q533093","display_name":"On the fly","level":2,"score":0.28760001063346863},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2791000008583069},{"id":"https://openalex.org/C2778739407","wikidata":"https://www.wikidata.org/wiki/Q165372","display_name":"CLIPS","level":2,"score":0.2718999981880188},{"id":"https://openalex.org/C161156560","wikidata":"https://www.wikidata.org/wiki/Q1638872","display_name":"Document retrieval","level":2,"score":0.26510000228881836},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.2587999999523163}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.10228","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.10228","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.10228","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.10228","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"As":[0],"video":[1,18],"becomes":[2],"increasingly":[3,22],"central":[4],"to":[5,15,34,81,116,165],"information":[6],"dissemination":[7],"and":[8,40,55,85,95,135,141,168,181],"multimodal":[9],"large":[10],"language":[11],"models":[12,130],"(MLLMs)":[13],"continue":[14],"advance,":[16],"evaluating":[17],"retrieval":[19,45,65,115],"has":[20],"become":[21],"important.":[23],"In":[24],"realistic":[25],"search":[26],"scenarios,":[27],"this":[28],"requires":[29],"matching":[30],"short":[31,51],"user":[32],"queries":[33,105,153],"long-form":[35],"content":[36],"using":[37],"both":[38,125],"visual":[39],"auditory":[41],"evidence.":[42],"Yet":[43],"existing":[44],"benchmarks":[46],"are":[47,106,126,183],"still":[48],"dominated":[49],"by":[50,109],"clips,":[52],"single":[53],"modalities,":[54],"caption-based":[56,134,159],"evaluation.":[57],"We":[58],"introduce":[59],"FLARE,":[60],"a":[61,110,172],"full-modality":[62],"long-video":[63],"audiovisual":[64,97,143,177],"benchmark":[66],"with":[67,92,100,146],"user-simulated":[68],"queries.":[69,103],"Built":[70],"from":[71],"399":[72],"carefully":[73],"screened":[74],"Video-MME":[75],"videos":[76],"(10--60":[77],"min,":[78],"225.4":[79],"h)":[80],"ensure":[82],"source":[83],"quality":[84],"diversity,":[86],"FLARE":[87,128],"contains":[88],"87,697":[89],"clips":[90],"annotated":[91],"vision,":[93,139],"audio,":[94,140],"unified":[96,142,176],"captions,":[98],"together":[99],"274,933":[101],"user-style":[102,152],"Cross-modal":[104],"further":[107],"filtered":[108],"hard":[111],"bimodal":[112],"constraint,":[113],"requiring":[114],"fail":[117],"under":[118,131],"either":[119],"modality":[120],"alone":[121],"but":[122],"succeed":[123],"when":[124],"combined.":[127],"evaluates":[129],"two":[132],"regimes,":[133],"query-based":[136,166],"retrieval,":[137,167],"across":[138],"settings.":[144],"Experiments":[145],"15":[147],"representative":[148],"retrievers":[149],"show":[150],"that":[151],"substantially":[154],"change":[155],"model":[156],"behavior,":[157],"strong":[158],"performance":[160],"does":[161],"not":[162],"always":[163],"transfer":[164],"audio--language":[169],"alignment":[170],"remains":[171],"key":[173],"bottleneck":[174],"for":[175],"retrieval.":[178],"Our":[179],"code":[180],"data":[182],"released":[184],"at":[185],"https://flarebench.github.io/":[186]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-13T00:00:00"}
