{"id":"https://openalex.org/W4402979040","doi":"https://doi.org/10.1109/icme57554.2024.10688049","title":"Local-to-Global Self-Consistency Learning for Temporal Action Localization","display_name":"Local-to-Global Self-Consistency Learning for Temporal Action Localization","publication_year":2024,"publication_date":"2024-07-15","ids":{"openalex":"https://openalex.org/W4402979040","doi":"https://doi.org/10.1109/icme57554.2024.10688049"},"language":"en","primary_location":{"id":"doi:10.1109/icme57554.2024.10688049","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme57554.2024.10688049","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102999463","display_name":"Xinyu Xiao","orcid":"https://orcid.org/0009-0006-2655-6287"},"institutions":[{"id":"https://openalex.org/I4210135679","display_name":"Antea Group (France)","ror":"https://ror.org/03kfw6k71","country_code":"FR","type":"company","lineage":["https://openalex.org/I4210101086","https://openalex.org/I4210135679"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Xinyu Xiao","raw_affiliation_strings":["ANT Group"],"affiliations":[{"raw_affiliation_string":"ANT Group","institution_ids":["https://openalex.org/I4210135679"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102787531","display_name":"Yun Hu","orcid":"https://orcid.org/0000-0002-8109-0284"},"institutions":[{"id":"https://openalex.org/I30809798","display_name":"ShanghaiTech University","ror":"https://ror.org/030bhh786","country_code":"CN","type":"education","lineage":["https://openalex.org/I30809798"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yun Hu","raw_affiliation_strings":["ShanghaiTech University"],"affiliations":[{"raw_affiliation_string":"ShanghaiTech University","institution_ids":["https://openalex.org/I30809798"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045424247","display_name":"Eryun Liu","orcid":"https://orcid.org/0000-0002-2344-4283"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Eryun Liu","raw_affiliation_strings":["Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102999463"],"corresponding_institution_ids":["https://openalex.org/I4210135679"],"apc_list":null,"apc_paid":null,"fwci":0.5263,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.66303779,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9866999983787537,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.973800003528595,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6475849151611328},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5829752087593079},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.555509626865387},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44577693939208984},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.0696241557598114}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6475849151611328},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5829752087593079},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.555509626865387},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44577693939208984},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0696241557598114},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme57554.2024.10688049","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme57554.2024.10688049","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.5099999904632568}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1927052826","https://openalex.org/W2336403884","https://openalex.org/W2952524552","https://openalex.org/W2963351448","https://openalex.org/W2963524571","https://openalex.org/W2983918066","https://openalex.org/W2997314266","https://openalex.org/W2997747012","https://openalex.org/W3034623254","https://openalex.org/W3106041614","https://openalex.org/W3128626728","https://openalex.org/W3173459793","https://openalex.org/W3174569083","https://openalex.org/W3176444885","https://openalex.org/W3202076256","https://openalex.org/W4214736059","https://openalex.org/W4312359819","https://openalex.org/W4312508181"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W2358024260"],"abstract_inverted_index":{"The":[0,154],"object":[1],"of":[2,31,40,82,96,160],"temporal":[3,17,41,62],"action":[4,12],"localization":[5],"(TAL)":[6],"is":[7,28,71,105,148],"to":[8,55,73,78,107,116,126,133,140,150],"predict":[9],"the":[10,15,38,57,75,92,109,117,128,136,141,144,152,158],"predefined":[11],"labels":[13],"and":[14,34,64,94,135,173,179,185],"corresponding":[16],"boundary":[18],"in":[19,61,122,163],"a":[20,29,67,88,99],"video.":[21],"It":[22],"can":[23],"be":[24],"found":[25],"that":[26],"TAL":[27],"task":[30],"multi-modal":[32],"modeling":[33,53],"highly":[35],"dependent":[36],"on":[37,177],"effect":[39],"context":[42],"representation.":[43],"Inspired":[44],"by":[45,113],"this":[46],"property,":[47],"we":[48],"propose":[49],"an":[50],"end-to-end":[51],"local-to-global":[52,68],"architecture":[54],"learn":[56,127],"contextual":[58],"consistency":[59,130,138],"information":[60],"sequence":[63,77],"cross-modal.":[65],"Specifically,":[66],"encoding":[69],"Transformer":[70],"applied":[72],"model":[74,170],"video":[76,80],"obtain":[79],"representation":[81],"different":[83,97,123],"time":[84],"scales.":[85],"To":[86],"achieve":[87],"reasonable":[89],"balance":[90],"between":[91],"specificity":[93,121],"correlation":[95],"modalities,":[98],"cross":[100],"semantic":[101,118],"alignment":[102],"(CSA)":[103],"module":[104],"proposed":[106],"re-weight":[108],"encoded":[110],"multi-model":[111],"features":[112],"whether":[114],"attending":[115],"correlations":[119],"or":[120],"modalities.":[124],"Further,":[125],"trans-modal":[129],"from":[131],"local":[132],"global":[134],"uni-modal":[137],"belonging":[139],"same":[142],"category,":[143],"self-consistency":[145],"learning":[146],"(SCL)":[147],"designed":[149],"train":[151],"network.":[153],"experimental":[155],"results":[156],"demonstrate":[157],"significance":[159],"our":[161],"method":[162],"major":[164],"improvements":[165],"upon":[166],"prior":[167],"works.":[168],"Our":[169],"achieves":[171],"68.3%":[172],"37.1%":[174],"average":[175],"mAPs":[176],"THUMOS14":[178],"ActivityNet":[180],"1.3,":[181],"outperforming":[182],"state-of-the-art":[183],"multi-stage":[184],"one-stage":[186],"models.":[187]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
