{"id":"https://openalex.org/W4387885776","doi":"https://doi.org/10.1109/tcsvt.2023.3326692","title":"Cross Time-Frequency Transformer for Temporal Action Localization","display_name":"Cross Time-Frequency Transformer for Temporal Action Localization","publication_year":2023,"publication_date":"2023-10-23","ids":{"openalex":"https://openalex.org/W4387885776","doi":"https://doi.org/10.1109/tcsvt.2023.3326692"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2023.3326692","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3326692","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100602678","display_name":"Jin Yang","orcid":"https://orcid.org/0000-0001-9625-7449"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jin Yang","raw_affiliation_strings":["National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101947241","display_name":"Ping Wei","orcid":"https://orcid.org/0000-0002-8535-9527"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ping Wei","raw_affiliation_strings":["National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047405956","display_name":"Nanning Zheng","orcid":"https://orcid.org/0000-0003-1608-8257"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nanning Zheng","raw_affiliation_strings":["National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Human-Machine Hybrid Augmented Intelligence, National Engineering Research Center of Visual Information and Applications, Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100602678"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.4014,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.90900903,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"34","issue":"6","first_page":"4625","last_page":"4638"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10510","display_name":"Stroke Rehabilitation and Recovery","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/2742","display_name":"Rehabilitation"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7483437061309814},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5708451271057129},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5596069097518921},{"id":"https://openalex.org/keywords/time\u2013frequency-analysis","display_name":"Time\u2013frequency analysis","score":0.5528952479362488},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5138023495674133},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4950241446495056},{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.44288402795791626},{"id":"https://openalex.org/keywords/frequency-domain","display_name":"Frequency domain","score":0.4233153164386749},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32784250378608704},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.15279555320739746},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.09154835343360901}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7483437061309814},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5708451271057129},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5596069097518921},{"id":"https://openalex.org/C142433447","wikidata":"https://www.wikidata.org/wiki/Q7806653","display_name":"Time\u2013frequency analysis","level":3,"score":0.5528952479362488},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5138023495674133},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4950241446495056},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.44288402795791626},{"id":"https://openalex.org/C19118579","wikidata":"https://www.wikidata.org/wiki/Q786423","display_name":"Frequency domain","level":2,"score":0.4233153164386749},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32784250378608704},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.15279555320739746},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.09154835343360901},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2023.3326692","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3326692","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G577169378","display_name":null,"funder_award_id":"2018AAA0102501","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":85,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1927052826","https://openalex.org/W2132984323","https://openalex.org/W2146048167","https://openalex.org/W2187089797","https://openalex.org/W2336403884","https://openalex.org/W2565639579","https://openalex.org/W2612218357","https://openalex.org/W2618799552","https://openalex.org/W2625366777","https://openalex.org/W2741196023","https://openalex.org/W2755876276","https://openalex.org/W2804005492","https://openalex.org/W2951143549","https://openalex.org/W2952435096","https://openalex.org/W2963095467","https://openalex.org/W2963524571","https://openalex.org/W2963563276","https://openalex.org/W2963857746","https://openalex.org/W2964214371","https://openalex.org/W2964274041","https://openalex.org/W2982770724","https://openalex.org/W2983918066","https://openalex.org/W2986407524","https://openalex.org/W2990503944","https://openalex.org/W2990763144","https://openalex.org/W2991089415","https://openalex.org/W2997314266","https://openalex.org/W2997706915","https://openalex.org/W3034623254","https://openalex.org/W3034971973","https://openalex.org/W3035251589","https://openalex.org/W3035396860","https://openalex.org/W3035588244","https://openalex.org/W3037916678","https://openalex.org/W3069380482","https://openalex.org/W3096609285","https://openalex.org/W3103334733","https://openalex.org/W3106041614","https://openalex.org/W3131500599","https://openalex.org/W3138516171","https://openalex.org/W3151130473","https://openalex.org/W3158201658","https://openalex.org/W3168101492","https://openalex.org/W3168825659","https://openalex.org/W3172347581","https://openalex.org/W3172837290","https://openalex.org/W3173459793","https://openalex.org/W3174569083","https://openalex.org/W3176444885","https://openalex.org/W3201612248","https://openalex.org/W3202076256","https://openalex.org/W3204588463","https://openalex.org/W3205786327","https://openalex.org/W3208474254","https://openalex.org/W4230270698","https://openalex.org/W4287062814","https://openalex.org/W4293094783","https://openalex.org/W4309396261","https://openalex.org/W4310015215","https://openalex.org/W4310921506","https://openalex.org/W4312372834","https://openalex.org/W4312508181","https://openalex.org/W4312832682","https://openalex.org/W4312944418","https://openalex.org/W4327810593","https://openalex.org/W4376607835","https://openalex.org/W4377000601","https://openalex.org/W4385245566","https://openalex.org/W4386057769","https://openalex.org/W4386076085","https://openalex.org/W4388392666","https://openalex.org/W6631190155","https://openalex.org/W6748455662","https://openalex.org/W6751684112","https://openalex.org/W6771062828","https://openalex.org/W6780677595","https://openalex.org/W6791776128","https://openalex.org/W6796237581","https://openalex.org/W6801682309","https://openalex.org/W6841287799","https://openalex.org/W6846726380","https://openalex.org/W6846867676","https://openalex.org/W6849990444","https://openalex.org/W6850826453"],"related_works":["https://openalex.org/W3000097931","https://openalex.org/W2354322770","https://openalex.org/W4237547500","https://openalex.org/W1570848052","https://openalex.org/W2373192430","https://openalex.org/W1947057263","https://openalex.org/W2355447608","https://openalex.org/W1980067354","https://openalex.org/W2033324903","https://openalex.org/W1978333447"],"abstract_inverted_index":{"Most":[0],"modern":[1],"approaches":[2],"in":[3,34,45,81,92,244],"temporal":[4,124],"action":[5],"localization":[6],"(TAL)":[7],"mainly":[8],"focus":[9],"on":[10,168,187,198,202,218],"time":[11,70,83,113,161],"domain":[12],"information,":[13],"while":[14],"neglecting":[15],"the":[16,69,78,82,86,93,120,123,142,160,239,245],"advantages":[17],"of":[18,145,196,227,241],"information":[19,27],"from":[20,28,100,138],"other":[21],"domains.":[22],"How":[23],"to":[24,67,135,237],"effectively":[25],"utilize":[26],"different":[29,101,139,148],"domains":[30],"and":[31,71,85,115,125,177,200,221,229],"their":[32],"interactions":[33],"a":[35,52,105,112,116,129,153,210],"reasonable":[36],"manner":[37],"has":[38],"been":[39],"an":[40,193,224],"attractive":[41],"yet":[42],"challenging":[43,170],"issue":[44],"TAL.":[46,60],"In":[47],"this":[48],"paper,":[49],"we":[50,103],"propose":[51,104],"novel":[53],"cross":[54,106],"time-frequency":[55,107],"Transformer":[56],"model":[57],"(TFFormer)":[58],"for":[59,158],"A":[61],"dual-branch":[62],"network":[63],"architecture":[64],"is":[65,133],"designed":[66,134],"capture":[68],"frequency":[72,94,117,126],"features":[73,99,137,146],"at":[74,147],"multiple":[75],"scales,":[76,140],"using":[77],"multi-scale":[79],"transformer":[80],"branch":[84],"DB1":[87],"Discrete":[88],"Wavelet":[89],"Transform":[90],"(DWT)":[91],"branch.":[95],"To":[96],"fuse":[97],"these":[98,188],"domains,":[102],"attention":[108],"mechanism":[109,132],"that":[110],"includes":[111],"pathway":[114],"pathway,":[118],"enhancing":[119],"interaction":[121],"between":[122],"features.":[127],"Furthermore,":[128],"gated":[130],"control":[131],"aggregate":[136],"characterizing":[141],"respective":[143],"contributions":[144],"scales.":[149],"We":[150,231],"also":[151,214,232],"design":[152],"new":[154],"regression":[155],"loss":[156],"function":[157],"locating":[159],"boundaries.":[162],"Extensive":[163],"experiments":[164],"were":[165],"carried":[166],"out":[167],"four":[169],"benchmark":[171],"datasets,":[172],"including":[173],"two":[174,178],"third-person":[175],"datasets":[176],"first-person":[179],"datasets.":[180,189],"The":[181],"proposed":[182,246],"method":[183],"achieves":[184,192],"impressive":[185],"results":[186,217],"Specifically,":[190],"TFFormer":[191],"average":[194,225],"mAP":[195,226],"23.2%":[197],"Ego4D":[199],"25.6%":[201],"EPIC-Kitchens":[203],"100,":[204],"which":[205],"outperform":[206],"previous":[207],"state-of-the-arts":[208],"by":[209],"large":[211],"margin.":[212],"It":[213],"obtains":[215],"competitive":[216],"ActivityNet":[219],"v1.3":[220],"THUMOS14,":[222],"with":[223],"36.2%":[228],"67.8%.":[230],"conducted":[233],"extensive":[234],"ablation":[235],"studies":[236],"validate":[238],"effectiveness":[240],"each":[242],"component":[243],"method.":[247]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":1}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
