{"id":"https://openalex.org/W4399073780","doi":"https://doi.org/10.1109/tcsvt.2024.3406546","title":"Free-Form Composition Networks for Egocentric Action Recognition","display_name":"Free-Form Composition Networks for Egocentric Action Recognition","publication_year":2024,"publication_date":"2024-05-28","ids":{"openalex":"https://openalex.org/W4399073780","doi":"https://doi.org/10.1109/tcsvt.2024.3406546"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2024.3406546","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/tcsvt.2024.3406546","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100324809","display_name":"Haoran Wang","orcid":"https://orcid.org/0000-0001-6350-5645"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haoran Wang","raw_affiliation_strings":["College of Information Science and Engineering, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100828963","display_name":"Qinghua Cheng","orcid":null},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qinghua Cheng","raw_affiliation_strings":["College of Information Science and Engineering, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085309099","display_name":"Baosheng Yu","orcid":"https://orcid.org/0000-0002-0761-7893"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Baosheng Yu","raw_affiliation_strings":["School of Computer Science, Faculty of Engineering, The University of Sydney, Sydney, NSW, Australia","Faculty of Engineering, School of Computer Science, The University of Sydney, Darlington, NSW, Australia"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, Faculty of Engineering, The University of Sydney, Sydney, NSW, Australia","institution_ids":["https://openalex.org/I129604602"]},{"raw_affiliation_string":"Faculty of Engineering, School of Computer Science, The University of Sydney, Darlington, NSW, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074672983","display_name":"Yibing Zhan","orcid":"https://orcid.org/0000-0003-3180-0484"},"institutions":[{"id":"https://openalex.org/I4210103986","display_name":"Jingdong (China)","ror":"https://ror.org/01dkjkq64","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210103986"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yibing Zhan","raw_affiliation_strings":["JD Explore Academy, Beijing, China"],"affiliations":[{"raw_affiliation_string":"JD Explore Academy, Beijing, China","institution_ids":["https://openalex.org/I4210103986"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067600725","display_name":"Dapeng Tao","orcid":"https://orcid.org/0000-0003-0783-5273"},"institutions":[{"id":"https://openalex.org/I189210763","display_name":"Yunnan University","ror":"https://ror.org/0040axw97","country_code":"CN","type":"education","lineage":["https://openalex.org/I189210763"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dapeng Tao","raw_affiliation_strings":["School of Information Science and Engineering, Yunnan University, Kunming, Yunnan, China","Yunnan United Vision Technology Co.Ltd, and Yunnan Key Laboratory of Media Convergence, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Engineering, Yunnan University, Kunming, Yunnan, China","institution_ids":["https://openalex.org/I189210763"]},{"raw_affiliation_string":"Yunnan United Vision Technology Co.Ltd, and Yunnan Key Laboratory of Media Convergence, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100456723","display_name":"Liang Ding","orcid":"https://orcid.org/0000-0001-8976-2084"},"institutions":[{"id":"https://openalex.org/I4210103986","display_name":"Jingdong (China)","ror":"https://ror.org/01dkjkq64","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210103986"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Ding","raw_affiliation_strings":["JD Explore Academy, Beijing, China"],"affiliations":[{"raw_affiliation_string":"JD Explore Academy, Beijing, China","institution_ids":["https://openalex.org/I4210103986"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061469520","display_name":"Haibin Ling","orcid":"https://orcid.org/0000-0003-4094-8413"},"institutions":[{"id":"https://openalex.org/I59553526","display_name":"Stony Brook University","ror":"https://ror.org/05qghxh33","country_code":"US","type":"education","lineage":["https://openalex.org/I59553526"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Haibin Ling","raw_affiliation_strings":["Department of Computer Science, Stony Brook University, Stony Brook, NY, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Stony Brook University, Stony Brook, NY, USA","institution_ids":["https://openalex.org/I59553526"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100324809"],"corresponding_institution_ids":["https://openalex.org/I9224756"],"apc_list":null,"apc_paid":null,"fwci":0.275,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.49112926,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"34","issue":"10","first_page":"9967","last_page":"9978"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.986299991607666,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6433555483818054},{"id":"https://openalex.org/keywords/composition","display_name":"Composition (language)","score":0.48487553000450134},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48367151618003845},{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action recognition","score":0.4740928113460541},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.45870599150657654},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.43712273240089417},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3669625520706177}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6433555483818054},{"id":"https://openalex.org/C40231798","wikidata":"https://www.wikidata.org/wiki/Q1333743","display_name":"Composition (language)","level":2,"score":0.48487553000450134},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48367151618003845},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.4740928113460541},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.45870599150657654},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.43712273240089417},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3669625520706177},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2024.3406546","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/tcsvt.2024.3406546","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.699999988079071,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G1115950578","display_name":null,"funder_award_id":"N2304012","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":85,"referenced_works":["https://openalex.org/W114517082","https://openalex.org/W1940585053","https://openalex.org/W1947050545","https://openalex.org/W2070999216","https://openalex.org/W2167626157","https://openalex.org/W2194775991","https://openalex.org/W2269938945","https://openalex.org/W2557269700","https://openalex.org/W2605973302","https://openalex.org/W2625022521","https://openalex.org/W2625366777","https://openalex.org/W2736809457","https://openalex.org/W2752912576","https://openalex.org/W2806331055","https://openalex.org/W2895299763","https://openalex.org/W2896659472","https://openalex.org/W2897187502","https://openalex.org/W2904008038","https://openalex.org/W2917792613","https://openalex.org/W2948058585","https://openalex.org/W2962895364","https://openalex.org/W2963082988","https://openalex.org/W2963224792","https://openalex.org/W2963514444","https://openalex.org/W2963524571","https://openalex.org/W2963601560","https://openalex.org/W2963853051","https://openalex.org/W2964118342","https://openalex.org/W2964222622","https://openalex.org/W2971680695","https://openalex.org/W2982277552","https://openalex.org/W2986364431","https://openalex.org/W2990152177","https://openalex.org/W2990503944","https://openalex.org/W2997004687","https://openalex.org/W3011334834","https://openalex.org/W3034257141","https://openalex.org/W3034369739","https://openalex.org/W3034973071","https://openalex.org/W3035179769","https://openalex.org/W3048602385","https://openalex.org/W3090590592","https://openalex.org/W3096688134","https://openalex.org/W3098028994","https://openalex.org/W3109754877","https://openalex.org/W3155644662","https://openalex.org/W3168279596","https://openalex.org/W3169024950","https://openalex.org/W3175123126","https://openalex.org/W3175528717","https://openalex.org/W3195479307","https://openalex.org/W3197395033","https://openalex.org/W3202237431","https://openalex.org/W3202241806","https://openalex.org/W3202801842","https://openalex.org/W3203574385","https://openalex.org/W3203770998","https://openalex.org/W3204691786","https://openalex.org/W3206930349","https://openalex.org/W3207758636","https://openalex.org/W3211407538","https://openalex.org/W4206654595","https://openalex.org/W4214899942","https://openalex.org/W4220932801","https://openalex.org/W4281752744","https://openalex.org/W4282964635","https://openalex.org/W4285453420","https://openalex.org/W4288062562","https://openalex.org/W4307079049","https://openalex.org/W4312372834","https://openalex.org/W4312710666","https://openalex.org/W4312757006","https://openalex.org/W4312848112","https://openalex.org/W4312894178","https://openalex.org/W4313118515","https://openalex.org/W4386071518","https://openalex.org/W4386076314","https://openalex.org/W4386083076","https://openalex.org/W4390872179","https://openalex.org/W6637373629","https://openalex.org/W6726873649","https://openalex.org/W6766978945","https://openalex.org/W6785527955","https://openalex.org/W6797206543","https://openalex.org/W6845973410"],"related_works":["https://openalex.org/W1499958165","https://openalex.org/W2380193321","https://openalex.org/W2041489351","https://openalex.org/W2367936492","https://openalex.org/W2588831577","https://openalex.org/W2749776132","https://openalex.org/W4229073194","https://openalex.org/W3130838260","https://openalex.org/W1576128429","https://openalex.org/W2269464716"],"abstract_inverted_index":{"Egocentric":[0],"action":[1,12,24,68,86,92,188,199,228],"recognition":[2,25,189,200],"is":[3,159],"gaining":[4],"significant":[5],"attention":[6],"in":[7,22,60,84,106,134,154],"the":[8,61,77,103,107,122,208,212,215],"field":[9],"of":[10,67,96,141,166,214],"human":[11],"recognition.":[13,229],"In":[14],"this":[15,33],"paper,":[16],"we":[17,35,71,145],"address":[18],"data":[19,180,220],"scarcity":[20,221],"issue":[21],"egocentric":[23,198,227],"from":[26,117,131],"a":[27,37,73,94,155,163,167,170],"compositional":[28],"generalization":[29],"perspective.":[30],"To":[31],"tackle":[32],"problem,":[34],"propose":[36],"free-form":[38,156],"composition":[39],"network":[40],"(FFCN)":[41],"that":[42],"can":[43,146,175],"simultaneously":[44],"learn":[45],"disentangled":[46],"verb,":[47],"preposition,":[48],"and":[49,52,98,114,128,143,169,205,207,225],"noun":[50],"representations,":[51],"then":[53],"use":[54,72],"them":[55],"to":[56,75,162],"compose":[57,147],"new":[58,148,178],"samples":[59,149,181],"feature":[62],"space":[63],"for":[64,150,182,218],"rare":[65,152,183],"classes":[66,153],"videos.":[69],"First,":[70],"graph":[74],"capture":[76],"spatial-temporal":[78,100,139],"relations":[79],"among":[80],"different":[81,118],"hand/object":[82],"instances":[83,133],"each":[85,91,135],"video.":[87],"We":[88,191],"thus":[89],"decompose":[90],"into":[93],"set":[95],"verb":[97,113,127,168],"preposition":[99,115,129],"representations":[101,116,130,140],"using":[102],"edge":[104],"features":[105],"graph.":[108],"The":[109,172],"temporal":[110],"decomposition":[111,124],"extracts":[112],"video":[119],"frames,":[120],"while":[121],"spatial":[123],"adaptively":[125],"learns":[126],"action-related":[132],"frame.":[136],"With":[137],"these":[138],"verbs":[142],"prepositions,":[144],"those":[151],"manner,":[157],"which":[158],"not":[160],"restricted":[161],"rigid":[164],"form":[165],"noun.":[171],"proposed":[173,216],"FFCN":[174],"directly":[176],"generate":[177],"training":[179],"classes,":[184],"hence":[185],"significantly":[186],"improve":[187],"performance.":[190],"evaluated":[192],"our":[193],"method":[194,217],"on":[195],"three":[196],"popular":[197],"datasets,":[201],"Something-Something":[202],"V2,":[203],"H2O,":[204],"EPIC-KITCHENS-100,":[206],"experimental":[209],"results":[210],"demonstrate":[211],"effectiveness":[213],"handling":[219],"problems,":[222],"including":[223],"long-tailed":[224],"few-shot":[226]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-12-23T23:11:35.936235","created_date":"2025-10-10T00:00:00"}
