{"id":"https://openalex.org/W4393079490","doi":"https://doi.org/10.1109/tip.2024.3378477","title":"Neighbor-Guided Pseudo-Label Generation and Refinement for Single-Frame Supervised Temporal Action Localization","display_name":"Neighbor-Guided Pseudo-Label Generation and Refinement for Single-Frame Supervised Temporal Action Localization","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4393079490","doi":"https://doi.org/10.1109/tip.2024.3378477","pmid":"https://pubmed.ncbi.nlm.nih.gov/38517712"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2024.3378477","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2024.3378477","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102784548","display_name":"Guozhang Li","orcid":"https://orcid.org/0000-0002-7069-7486"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Guozhang Li","raw_affiliation_strings":["State Key Laboratory of Integrated Services Networks, School of Electronic Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Integrated Services Networks, School of Electronic Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067159497","display_name":"De Cheng","orcid":"https://orcid.org/0000-0003-4603-847X"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"De Cheng","raw_affiliation_strings":["State Key Laboratory of Integrated Services Networks, School of Telecommunications Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Integrated Services Networks, School of Telecommunications Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042507268","display_name":"Nannan Wang","orcid":"https://orcid.org/0000-0002-4695-6134"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nannan Wang","raw_affiliation_strings":["State Key Laboratory of Integrated Services Networks, School of Telecommunications Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Integrated Services Networks, School of Telecommunications Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100642867","display_name":"Jie Li","orcid":"https://orcid.org/0000-0001-7950-4233"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Li","raw_affiliation_strings":["State Key Laboratory of Integrated Services Networks, School of Electronic Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Integrated Services Networks, School of Electronic Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101785348","display_name":"Xinbo Gao","orcid":"https://orcid.org/0000-0003-1443-0776"},"institutions":[{"id":"https://openalex.org/I10535382","display_name":"Chongqing University of Posts and Telecommunications","ror":"https://ror.org/03dgaqz26","country_code":"CN","type":"education","lineage":["https://openalex.org/I10535382"]},{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinbo Gao","raw_affiliation_strings":["School of Electronic Engineering, Xidian University, Xi&#x2019;an, China","Chongqing Key Laboratory of Image Cognition, Chongqing University of Posts and Telecommunications, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Engineering, Xidian University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I149594827"]},{"raw_affiliation_string":"Chongqing Key Laboratory of Image Cognition, Chongqing University of Posts and Telecommunications, Chongqing, China","institution_ids":["https://openalex.org/I10535382"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5102784548"],"corresponding_institution_ids":["https://openalex.org/I149594827"],"apc_list":null,"apc_paid":null,"fwci":2.4928,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.90000734,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"33","issue":null,"first_page":"2419","last_page":"2430"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7279901504516602},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6716729402542114},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6623510718345642},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5813696980476379},{"id":"https://openalex.org/keywords/nearest-neighbor-search","display_name":"Nearest neighbor search","score":0.5370290279388428},{"id":"https://openalex.org/keywords/k-nearest-neighbors-algorithm","display_name":"k-nearest neighbors algorithm","score":0.5238611698150635},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.47588980197906494},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.4440550208091736},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.44082891941070557},{"id":"https://openalex.org/keywords/cosine-similarity","display_name":"Cosine similarity","score":0.4382275342941284}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7279901504516602},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6716729402542114},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6623510718345642},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5813696980476379},{"id":"https://openalex.org/C116738811","wikidata":"https://www.wikidata.org/wiki/Q608751","display_name":"Nearest neighbor search","level":2,"score":0.5370290279388428},{"id":"https://openalex.org/C113238511","wikidata":"https://www.wikidata.org/wiki/Q1071612","display_name":"k-nearest neighbors algorithm","level":2,"score":0.5238611698150635},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.47588980197906494},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.4440550208091736},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.44082891941070557},{"id":"https://openalex.org/C2780762811","wikidata":"https://www.wikidata.org/wiki/Q1784941","display_name":"Cosine similarity","level":3,"score":0.4382275342941284},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2024.3378477","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2024.3378477","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:38517712","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38517712","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2022121445","display_name":null,"funder_award_id":"U21A20514","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2452297484","display_name":null,"funder_award_id":"QTZX23042","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G4297946667","display_name":null,"funder_award_id":"U22A2096","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G844604588","display_name":null,"funder_award_id":"62176198","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8946150788","display_name":null,"funder_award_id":"62176195","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G913836228","display_name":null,"funder_award_id":"62036007","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":85,"referenced_works":["https://openalex.org/W61928934","https://openalex.org/W1522301498","https://openalex.org/W1927052826","https://openalex.org/W1977814411","https://openalex.org/W2121056381","https://openalex.org/W2193145675","https://openalex.org/W2321611732","https://openalex.org/W2520861906","https://openalex.org/W2593722617","https://openalex.org/W2604113307","https://openalex.org/W2619947201","https://openalex.org/W2799262584","https://openalex.org/W2884293275","https://openalex.org/W2893390896","https://openalex.org/W2895240652","https://openalex.org/W2919974746","https://openalex.org/W2948229620","https://openalex.org/W2960131371","https://openalex.org/W2962709777","https://openalex.org/W2963524571","https://openalex.org/W2964216549","https://openalex.org/W2964274041","https://openalex.org/W2975310793","https://openalex.org/W2983918066","https://openalex.org/W2986407524","https://openalex.org/W2998601171","https://openalex.org/W2998702159","https://openalex.org/W3005655588","https://openalex.org/W3034623254","https://openalex.org/W3035585099","https://openalex.org/W3095669214","https://openalex.org/W3096609285","https://openalex.org/W3106250896","https://openalex.org/W3109715102","https://openalex.org/W3109986575","https://openalex.org/W3110718159","https://openalex.org/W3112040205","https://openalex.org/W3128626728","https://openalex.org/W3162565403","https://openalex.org/W3173212682","https://openalex.org/W3173698268","https://openalex.org/W3174511093","https://openalex.org/W3176444885","https://openalex.org/W3176630873","https://openalex.org/W3180945712","https://openalex.org/W3189379416","https://openalex.org/W3202825210","https://openalex.org/W3203848195","https://openalex.org/W3207927851","https://openalex.org/W3208354063","https://openalex.org/W3211158804","https://openalex.org/W3213436376","https://openalex.org/W3214808272","https://openalex.org/W4205415396","https://openalex.org/W4225352246","https://openalex.org/W4226500165","https://openalex.org/W4226501520","https://openalex.org/W4280634279","https://openalex.org/W4289535637","https://openalex.org/W4301963599","https://openalex.org/W4304945116","https://openalex.org/W4309665692","https://openalex.org/W4310560168","https://openalex.org/W4312305885","https://openalex.org/W4312317576","https://openalex.org/W4312383773","https://openalex.org/W4312440249","https://openalex.org/W4312508181","https://openalex.org/W4312982010","https://openalex.org/W4313013512","https://openalex.org/W4313024697","https://openalex.org/W4313050661","https://openalex.org/W4313128368","https://openalex.org/W4367834746","https://openalex.org/W4386066453","https://openalex.org/W4386076495","https://openalex.org/W6631190155","https://openalex.org/W6678280073","https://openalex.org/W6781063151","https://openalex.org/W6785821353","https://openalex.org/W6787021940","https://openalex.org/W6802864417","https://openalex.org/W6839041728","https://openalex.org/W6847562344","https://openalex.org/W6955071965"],"related_works":["https://openalex.org/W2148008870","https://openalex.org/W2381195555","https://openalex.org/W2368606575","https://openalex.org/W4246757943","https://openalex.org/W2132753198","https://openalex.org/W2369874856","https://openalex.org/W2182477562","https://openalex.org/W2792185758","https://openalex.org/W2787484455","https://openalex.org/W2119808169"],"abstract_inverted_index":{"Due":[0],"to":[1,100,122,143],"the":[2,45,67,70,108,112,119,155,180,184,196,200,205,211,215],"sparse":[3],"single-frame":[4,48],"annotations,":[5],"current":[6],"Single-Frame":[7],"Temporal":[8],"Action":[9],"Localization":[10],"(SF-TAL)":[11],"methods":[12],"generally":[13],"employ":[14],"threshold-based":[15],"pseudo-label":[16,55,80,87,133,198],"generation":[17,81],"strategies.":[18],"However,":[19],"these":[20,59],"approaches":[21],"suffer":[22],"from":[23],"inefficient":[24],"data":[25],"utilization,":[26],"as":[27],"only":[28],"parts":[29],"of":[30,47,69,172,195],"unlabeled":[31,128],"frames":[32],"with":[33,73,210],"confidence":[34],"scores":[35],"surpassing":[36],"a":[37,92,97,192],"predefined":[38],"threshold":[39],"are":[40],"selected":[41],"for":[42,134,168],"training.":[43],"Moreover,":[44],"variability":[46],"annotations":[49],"and":[50,83,127,130,199,214,236],"unreliable":[51,144],"model":[52,145,206],"predictions":[53,121,158],"introduce":[54],"noise.":[56],"To":[57,147],"address":[58],"challenges,":[60],"we":[61,166,229],"propose":[62],"two":[63],"strategies":[64],"by":[65,118,176,191],"using":[66],"relationship":[68],"video":[71,174],"segments":[72],"their":[74,161],"neighbors':":[75],"1)":[76],"temporal":[77,102],"neighbor-guided":[78,86],"soft":[79,132,186],"(TNPG);":[82],"2)":[84],"semantic":[85,162,169,201],"refinement":[88],"(SNPR).":[89],"TNPG":[90],"utilizes":[91],"local-global":[93],"self-attention":[94,114],"mechanism":[95],"in":[96,179],"transformer":[98],"encoder":[99],"capture":[101],"neighbor":[103],"information":[104,124],"while":[105],"focusing":[106],"on":[107,154,224,233],"whole":[109],"video.":[110],"Then":[111,183],"generated":[113],"map":[115],"is":[116],"multiplied":[117],"network":[120],"propagate":[123],"between":[125],"labeled":[126],"frames,":[129],"produce":[131],"all":[135],"segments.":[136],"Despite":[137],"this,":[138,149],"label":[139],"noise":[140],"persists":[141],"due":[142],"predictions.":[146],"mitigate":[148],"SNPR":[150],"refines":[151],"pseudo-labels":[152,187],"based":[153],"assumption":[156],"that":[157,228],"should":[159],"resemble":[160],"nearest":[163,170,202],"neighbors'.":[164,203],"Specifically,":[165],"search":[167],"neighbors":[171],"each":[173],"segment":[175],"cosine":[177],"similarity":[178],"feature":[181],"space.":[182],"refined":[185,212],"can":[188,207],"be":[189,208],"obtained":[190],"weight":[193],"combination":[194],"original":[197],"Finally,":[204],"trained":[209],"pseudo-labels,":[213],"performance":[216],"has":[217],"been":[218],"greatly":[219],"improved.":[220],"Comprehensive":[221],"experimental":[222],"results":[223],"different":[225],"benchmarks":[226],"show":[227],"achieve":[230],"state-of-the-art":[231],"performances":[232],"THUMOS14,":[234],"ActivityNet1.2,":[235],"ActivityNet1.3":[237],"datasets.":[238]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":5}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
