{"id":"https://openalex.org/W7164823259","doi":"https://doi.org/10.1145/3805622.3810648","title":"Event-Centric Structural Modeling for Zero-Shot Video Moment Retrieval","display_name":"Event-Centric Structural Modeling for Zero-Shot Video Moment Retrieval","publication_year":2026,"publication_date":"2026-06-15","ids":{"openalex":"https://openalex.org/W7164823259","doi":"https://doi.org/10.1145/3805622.3810648"},"language":null,"primary_location":{"id":"doi:10.1145/3805622.3810648","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3805622.3810648","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3805622.3810648","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5138680607","display_name":"Xin Li","orcid":"https://orcid.org/0009-0007-7879-4321"},"institutions":[{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Li","raw_affiliation_strings":["Institute of Information Engineering\uff0cChinese Academy of Sciences, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0007-7879-4321","affiliations":[{"raw_affiliation_string":"Institute of Information Engineering\uff0cChinese Academy of Sciences, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, 
China","institution_ids":["https://openalex.org/I4210156404"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087187938","display_name":"Yongxiu Xu","orcid":"https://orcid.org/0000-0003-2963-0914"},"institutions":[{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongxiu Xu","raw_affiliation_strings":["Institute of Information Engineering\uff0cChinese Academy of Sciences, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-2963-0914","affiliations":[{"raw_affiliation_string":"Institute of Information Engineering\uff0cChinese Academy of Sciences, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210156404"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5138683921","display_name":"Yuyao Kong","orcid":"https://orcid.org/0009-0005-4136-7356"},"institutions":[{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuyao Kong","raw_affiliation_strings":["Institute of Information Engineering\uff0cChinese Academy of Sciences, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0005-4136-7356","affiliations":[{"raw_affiliation_string":"Institute of Information Engineering\uff0cChinese Academy of Sciences, Beijing, China and School of Cyber 
Security, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210156404"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101752081","display_name":"Hongbo Xu","orcid":"https://orcid.org/0000-0002-0258-7840"},"institutions":[{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongbo Xu","raw_affiliation_strings":["Institute of Information Engineering\uff0cChinese Academy of Sciences, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-0258-7840","affiliations":[{"raw_affiliation_string":"Institute of Information Engineering\uff0cChinese Academy of Sciences, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210156404"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052269317","display_name":"Gaopeng Gou","orcid":"https://orcid.org/0000-0002-3533-4874"},"institutions":[{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gaopeng Gou","raw_affiliation_strings":["Institute of Information Engineering\uff0cChinese Academy of Sciences, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3533-4874","affiliations":[{"raw_affiliation_string":"Institute of Information Engineering\uff0cChinese 
Academy of Sciences, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210156404"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038842107","display_name":"Yubin Wang","orcid":"https://orcid.org/0000-0002-6464-3203"},"institutions":[{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yubin Wang","raw_affiliation_strings":["Institute of Information Engineering\uff0cChinese Academy of Sciences, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-6464-3203","affiliations":[{"raw_affiliation_string":"Institute of Information Engineering\uff0cChinese Academy of Sciences, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210156404"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.93576333,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1298","last_page":"1307"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8526999950408936,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern 
Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8526999950408936,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.06120000034570694,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.03460000082850456,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.8371999859809875},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.6022999882698059},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5961999893188477},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.5893999934196472},{"id":"https://openalex.org/keywords/moment","display_name":"Moment 
(physics)","score":0.566100001335144},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.531499981880188},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5307000279426575},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5120000243186951},{"id":"https://openalex.org/keywords/boundary","display_name":"Boundary (topology)","score":0.4823000133037567},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.45210000872612}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.8371999859809875},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7178000211715698},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.6022999882698059},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5961999893188477},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.5893999934196472},{"id":"https://openalex.org/C179254644","wikidata":"https://www.wikidata.org/wiki/Q13222844","display_name":"Moment (physics)","level":2,"score":0.566100001335144},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial 
intelligence","level":1,"score":0.541700005531311},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.531499981880188},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5307000279426575},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5120000243186951},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.4823000133037567},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.45210000872612},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4311000108718872},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.42410001158714294},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.4077000021934509},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.3993000090122223},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.382999986410141},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.35679998993873596},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source 
code","level":2,"score":0.3237000107765198},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.31060001254081726},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.30230000615119934},{"id":"https://openalex.org/C100675267","wikidata":"https://www.wikidata.org/wiki/Q1371624","display_name":"Background noise","level":2,"score":0.30160000920295715},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.29670000076293945},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.28679999709129333},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.28600001335144043},{"id":"https://openalex.org/C2776235265","wikidata":"https://www.wikidata.org/wiki/Q18392052","display_name":"Fragment (logic)","level":2,"score":0.2782999873161316},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.27639999985694885},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.27480000257492065},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast 
(vision)","level":2,"score":0.2630000114440918},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.258899986743927},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.2549000084400177},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.2517000138759613}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3805622.3810648","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3805622.3810648","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3805622.3810648","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3805622.3810648","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.7632176280021667,"display_name":"Reduced 
inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W2008458232","https://openalex.org/W2027972120","https://openalex.org/W2948958195","https://openalex.org/W2962677524","https://openalex.org/W2963662190","https://openalex.org/W2963916161","https://openalex.org/W2964089981","https://openalex.org/W2964216549","https://openalex.org/W2983918066","https://openalex.org/W2997429269","https://openalex.org/W2998712570","https://openalex.org/W3034743747","https://openalex.org/W3035339529","https://openalex.org/W3152619510","https://openalex.org/W3162694035","https://openalex.org/W3174364033","https://openalex.org/W3199096350","https://openalex.org/W3216763528","https://openalex.org/W4214773477","https://openalex.org/W4221154629","https://openalex.org/W4221167018","https://openalex.org/W4230025115","https://openalex.org/W4283814553","https://openalex.org/W4293083879","https://openalex.org/W4304091802","https://openalex.org/W4312245888","https://openalex.org/W4312402470","https://openalex.org/W4312509824","https://openalex.org/W4319299894","https://openalex.org/W4385572302","https://openalex.org/W4386057806","https://openalex.org/W4386076626","https://openalex.org/W4386083089","https://openalex.org/W4389519587","https://openalex.org/W4390873341","https://openalex.org/W4390873423","https://openalex.org/W4393159289","https://openalex.org/W4394625732","https://openalex.org/W4399418564","https://openalex.org/W4402671548","https://openalex.org/W4409366186","https://openalex.org/W4409581350","https://openalex.org/W7108068597"],"related_works":[],"abstract_inverted_index":{"Zero-Shot":[0],"Video":[1],"Moment":[2],"Retrieval":[3],"(VMR)":[4],"aims":[5],"to":[6,18,56,87,101,131,140],"localize":[7],"a":[8,19,41],"specific":[9],"temporal":[10,33],"segment":[11],"in":[12,52,165],"an":[13,36,115],"untrimmed":[14,37],"video":[15,
38],"that":[16,68,159],"corresponds":[17],"natural":[20],"language":[21],"query":[22],"by":[23],"leveraging":[24],"frozen":[25],"vision-language":[26],"models,":[27],"eliminating":[28],"the":[29,66,72,103,106,142,166],"need":[30],"for":[31],"costly":[32],"annotations.":[34],"Fundamentally,":[35],"consists":[39],"of":[40,43,105,145],"sequence":[42],"atomic":[44],"events":[45,59,146],"with":[46,71,127],"varying":[47],"lengths.":[48],"A":[49],"critical":[50],"challenge":[51],"VMR":[53],"is":[54,178],"thus":[55],"disentangle":[57],"these":[58,111],"into":[60],"coherent":[61,90],"candidates":[62],"and":[63,155,169],"accurately":[64],"identify":[65],"one":[67],"best":[69],"aligns":[70],"query.":[73],"However,":[74],"conventional":[75],"methods":[76],"often":[77],"overlook":[78],"this":[79],"inherent":[80],"event":[81,133],"structure:":[82],"rigid":[83,125],"sliding":[84],"windows":[85],"tend":[86],"fragment":[88],"semantically":[89],"events,":[91],"while":[92,147],"uniform":[93],"pooling":[94],"across":[95,173],"frames":[96],"allows":[97],"ambiguous":[98],"boundary":[99,149],"noise":[100],"dilute":[102],"relevance":[104],"discriminative":[107,143],"core.":[108],"To":[109],"mitigate":[110],"issues,":[112],"we":[113,136],"propose":[114],"Event-Centric":[116],"Structural":[117],"Modeling":[118],"(ECSM)":[119],"framework.":[120],"Specifically,":[121],"our":[122,160],"approach":[123],"replaces":[124],"windowing":[126],"adaptive":[128],"global":[129],"segmentation":[130],"preserve":[132],"integrity.":[134],"Furthermore,":[135],"introduce":[137],"Gaussian-based":[138],"weighting":[139],"highlight":[141],"core":[144],"suppressing":[148],"interference.":[150],"Extensive":[151],"experiments":[152],"on":[153],"Charades-STA":[154],"ActivityNet":[156],"Captions":[157],"demonstrate":[158],"method":[161],"achieves":[162],"state-of-the-art":[163],"performance":[164],"training-free":[167],"setting":[168],"exhibits":[170],"robust":[171],"generalization":[172],"diverse":[174],"out-of-distri
bution":[175],"scenarios.":[176],"Code":[177],"available":[179],"at":[180],"https://github.com/youziizii/ECSM.":[181]},"counts_by_year":[],"updated_date":"2026-06-16T07:37:23.134862","created_date":"2026-06-16T00:00:00"}
