{"id":"https://openalex.org/W7124899164","doi":"https://doi.org/10.1109/tmm.2026.3655467","title":"Hybrid Debiasing Transformer With Adaptive Regularization for Video Moment Localization","display_name":"Hybrid Debiasing Transformer With Adaptive Regularization for Video Moment Localization","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7124899164","doi":"https://doi.org/10.1109/tmm.2026.3655467"},"language":null,"primary_location":{"id":"doi:10.1109/tmm.2026.3655467","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2026.3655467","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058078587","display_name":"Jiong Yin","orcid":"https://orcid.org/0000-0002-1991-4908"},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiong Yin","raw_affiliation_strings":["School of Automation, Hangzhou Dianzi University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-1991-4908","affiliations":[{"raw_affiliation_string":"School of Automation, Hangzhou Dianzi University, Hangzhou, China","institution_ids":["https://openalex.org/I50760025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123407160","display_name":"Liang Li","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210090176","display_name":"Institute of Computing Technology","ror":"https://ror.org/0090r4d87","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210090176"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Li","raw_affiliation_strings":["Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-8437-4824","affiliations":[{"raw_affiliation_string":"Institute of Computing Technology, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210090176","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jiehua Zhang","orcid":"https://orcid.org/0000-0003-0790-9279"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiehua Zhang","raw_affiliation_strings":["School of Software Engineering, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0003-0790-9279","affiliations":[{"raw_affiliation_string":"School of Software Engineering, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123374057","display_name":"Chenggang Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenggang Yan","raw_affiliation_strings":["School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-1204-0512","affiliations":[{"raw_affiliation_string":"School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China","institution_ids":["https://openalex.org/I50760025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086371835","display_name":"Hongkui Wang","orcid":"https://orcid.org/0000-0002-4443-798X"},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongkui Wang","raw_affiliation_strings":["School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-4443-798X","affiliations":[{"raw_affiliation_string":"School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China","institution_ids":["https://openalex.org/I50760025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048712886","display_name":"Yaoqi Sun","orcid":"https://orcid.org/0000-0001-8874-241X"},"institutions":[{"id":"https://openalex.org/I3129496460","display_name":"Lishui University","ror":"https://ror.org/0418kp584","country_code":"CN","type":"education","lineage":["https://openalex.org/I3129496460"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaoqi Sun","raw_affiliation_strings":["Lishui University, Lishui, China"],"raw_orcid":"https://orcid.org/0000-0001-8874-241X","affiliations":[{"raw_affiliation_string":"Lishui University, Lishui, China","institution_ids":["https://openalex.org/I3129496460"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078069878","display_name":"Zunjie Zhu","orcid":"https://orcid.org/0000-0001-6107-4538"},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zunjie Zhu","raw_affiliation_strings":["School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-6107-4538","affiliations":[{"raw_affiliation_string":"School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, China","institution_ids":["https://openalex.org/I50760025"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.07645992,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"28","issue":null,"first_page":"3986","last_page":"4001"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7010999917984009,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7010999917984009,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.1386999934911728,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.07760000228881836,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.7487999796867371},{"id":"https://openalex.org/keywords/debiasing","display_name":"Debiasing","score":0.701200008392334},{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.6819999814033508},{"id":"https://openalex.org/keywords/timestamp","display_name":"Timestamp","score":0.6287999749183655},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.4927000105381012},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4528000056743622},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4239000082015991},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.36559998989105225},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.35269999504089355}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7972999811172485},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.7487999796867371},{"id":"https://openalex.org/C2779458634","wikidata":"https://www.wikidata.org/wiki/Q24963715","display_name":"Debiasing","level":2,"score":0.701200008392334},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.6819999814033508},{"id":"https://openalex.org/C113954288","wikidata":"https://www.wikidata.org/wiki/Q186885","display_name":"Timestamp","level":2,"score":0.6287999749183655},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5030999779701233},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.4927000105381012},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4528000056743622},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4239000082015991},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39340001344680786},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.36559998989105225},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.36419999599456787},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.35269999504089355},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.3393999934196472},{"id":"https://openalex.org/C179254644","wikidata":"https://www.wikidata.org/wiki/Q13222844","display_name":"Moment (physics)","level":2,"score":0.336899995803833},{"id":"https://openalex.org/C4438859","wikidata":"https://www.wikidata.org/wiki/Q186117","display_name":"Timeline","level":2,"score":0.3199999928474426},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.3190999925136566},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3018999993801117},{"id":"https://openalex.org/C132459708","wikidata":"https://www.wikidata.org/wiki/Q744069","display_name":"Extrapolation","level":2,"score":0.30090001225471497},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.2872999906539917},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.2793999910354614},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2786000072956085},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.2653000056743622},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.2599000036716461},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.25600001215934753},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.2533999979496002},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2026.3655467","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2026.3655467","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4223952293395996,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Video":[0],"Moment":[1],"Localization":[2],"(VML)":[3],"is":[4,72],"a":[5,20,94,100,109,132,156],"task":[6],"that":[7,35],"seeks":[8],"to":[9,74,112,136,161,170,183],"pinpoint":[10],"the":[11,26,43,66,75,79,84,90,146,163,180,185,190,197,204],"most":[12],"pertinent":[13],"segment":[14],"within":[15],"an":[16],"untrimmed":[17],"video":[18],"using":[19],"linguistic":[21,158],"query.":[22],"Previous":[23],"works":[24],"expose":[25],"severe":[27],"data":[28,49],"bias":[29,81,148,187],"issues":[30],"in":[31],"VML":[32],"and":[33,54,65,78,123,144],"note":[34],"models":[36],"avoid":[37],"understanding":[38],"visual-textual":[39],"content":[40],"by":[41,116,150,188],"adapting":[42],"timestamp":[44],"distribution.":[45],"The":[46,57,70],"work":[47],"investigates":[48],"biases":[50],"from":[51,61,83,140,174],"both":[52],"intrinsic":[53,147],"extrinsic":[55],"perspectives:":[56],"former":[58],"arises":[59],"primarily":[60],"moment":[62,127,142],"boundary":[63,114],"ambiguity":[64,115],"inputoutput":[67],"information":[68,139,151],"imbalance.":[69,152],"latter":[71],"attributed":[73],"longtail":[76],"distribution":[77],"semantic":[80,186],"resulting":[82],"limited":[85],"tail":[86,175],"samples.":[87,176],"To":[88],"reduce":[89],"issues,":[91],"we":[92,107,130,154,178],"develop":[93,155],"hybrid":[95,157],"multimodal":[96],"debiasing":[97],"network":[98],"with":[99,126],"temporal":[101,133],"consistency":[102,134],"constraint":[103,135],"for":[104],"VML.":[105],"Firstly,":[106],"propose":[108],"multi-temporal":[110],"Transformer":[111,182],"alleviate":[113,184],"merging":[117],"frame-wise":[118],"features":[119],"into":[120],"segment-wise":[121],"representations":[122],"dynamically":[124],"aligning":[125],"boundaries.":[128],"Subsequently,":[129],"implement":[131],"accentuate":[137],"action":[138],"complex":[141],"context":[143],"mitigate":[145,162],"caused":[149],"Moreover,":[153],"activation":[159],"module":[160],"long-tail":[164],"bias,":[165],"which":[166],"offers":[167],"prior":[168],"guidance":[169],"emphasize":[171],"distinguishing":[172],"clues":[173],"Additionally,":[177],"introduce":[179],"prior-guided":[181],"learning":[189],"global":[191],"semantics":[192],"of":[193,206],"sentences,":[194],"thereby":[195],"circumventing":[196],"tail-sample":[198],"overfitting":[199],"issue.":[200],"Comprehensive":[201],"experiments":[202],"demonstrate":[203],"efficacy":[205],"our":[207],"proposed":[208],"method":[209],"across":[210],"three":[211],"datasets.":[212]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-01-21T00:00:00"}
