{"id":"https://openalex.org/W3119381934","doi":"https://doi.org/10.1109/tpami.2021.3049156","title":"Cascaded Parsing of Human-Object Interaction Recognition","display_name":"Cascaded Parsing of Human-Object Interaction Recognition","publication_year":2021,"publication_date":"2021-01-05","ids":{"openalex":"https://openalex.org/W3119381934","doi":"https://doi.org/10.1109/tpami.2021.3049156","mag":"3119381934","pmid":"https://pubmed.ncbi.nlm.nih.gov/33400648"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2021.3049156","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2021.3049156","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091518967","display_name":"Tianfei Zhou","orcid":"https://orcid.org/0000-0001-5475-1473"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Tianfei Zhou","raw_affiliation_strings":["ETH Zurich, Zurich, Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Zurich, Zurich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043510420","display_name":"Siyuan Qi","orcid":"https://orcid.org/0000-0002-4070-733X"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Siyuan Qi","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101433884","display_name":"Wenguan Wang","orcid":"https://orcid.org/0000-0002-0802-9567"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Wenguan Wang","raw_affiliation_strings":["ETH Zurich, Zurich, Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Zurich, Zurich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102851352","display_name":"Jianbing Shen","orcid":"https://orcid.org/0000-0003-2656-3082"},"institutions":[{"id":"https://openalex.org/I204512498","display_name":"University of Macau","ror":"https://ror.org/01r4q9n85","country_code":"MO","type":"education","lineage":["https://openalex.org/I204512498"]}],"countries":["MO"],"is_corresponding":false,"raw_author_name":"Jianbing Shen","raw_affiliation_strings":["State Key Laboratory of IOTSC, Department of Computer and Information Science, University of Macau, Macau, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of IOTSC, Department of Computer and Information Science, University of Macau, Macau, China","institution_ids":["https://openalex.org/I204512498"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034228010","display_name":"Song\u2010Chun Zhu","orcid":"https://orcid.org/0009-0008-0876-8117"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Song-Chun Zhu","raw_affiliation_strings":["Tsinghua University, Beijing, China","Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5091518967"],"corresponding_institution_ids":["https://openalex.org/I35440088"],"apc_list":null,"apc_paid":null,"fwci":9.883,"has_fulltext":false,"cited_by_count":118,"citation_normalized_percentile":{"value":0.98732659,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"44","issue":"6","first_page":"2827","last_page":"2840"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.799127459526062},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7529277205467224},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6121271848678589},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5649279356002808},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5009438991546631},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4966619610786438},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.48851263523101807},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.4555432200431824},{"id":"https://openalex.org/keywords/scene-graph","display_name":"Scene graph","score":0.442920982837677},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.42580947279930115},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3525328040122986},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3504706621170044},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3312034010887146},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2775209844112396},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.14640843868255615},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.12976425886154175}],"concepts":[{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.799127459526062},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7529277205467224},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6121271848678589},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5649279356002808},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5009438991546631},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4966619610786438},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.48851263523101807},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.4555432200431824},{"id":"https://openalex.org/C179372163","wikidata":"https://www.wikidata.org/wiki/Q1406181","display_name":"Scene graph","level":3,"score":0.442920982837677},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.42580947279930115},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3525328040122986},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3504706621170044},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3312034010887146},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2775209844112396},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.14640843868255615},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.12976425886154175},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D014796","descriptor_name":"Visual Perception","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D014796","descriptor_name":"Visual Perception","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D014796","descriptor_name":"Visual Perception","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2021.3049156","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2021.3049156","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:33400648","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/33400648","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.44999998807907104,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":96,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1517303303","https://openalex.org/W1536680647","https://openalex.org/W1551928752","https://openalex.org/W1861492603","https://openalex.org/W2024060531","https://openalex.org/W2036989445","https://openalex.org/W2038765747","https://openalex.org/W2050964073","https://openalex.org/W2106833577","https://openalex.org/W2116341502","https://openalex.org/W2131984901","https://openalex.org/W2136391815","https://openalex.org/W2147474239","https://openalex.org/W2158234032","https://openalex.org/W2159991108","https://openalex.org/W2165949176","https://openalex.org/W2169393274","https://openalex.org/W2194775991","https://openalex.org/W2214124602","https://openalex.org/W2307770531","https://openalex.org/W2339712187","https://openalex.org/W2579549467","https://openalex.org/W2581887665","https://openalex.org/W2606780347","https://openalex.org/W2737106217","https://openalex.org/W2779991293","https://openalex.org/W2789158025","https://openalex.org/W2798734012","https://openalex.org/W2801004733","https://openalex.org/W2808877322","https://openalex.org/W2883697687","https://openalex.org/W2886970679","https://openalex.org/W2888096830","https://openalex.org/W2888814092","https://openalex.org/W2889185481","https://openalex.org/W2896659472","https://openalex.org/W2940963663","https://openalex.org/W2950096400","https://openalex.org/W2950898568","https://openalex.org/W2955882737","https://openalex.org/W2962688385","https://openalex.org/W2962844592","https://openalex.org/W2963097937","https://openalex.org/W2963150697","https://openalex.org/W2963184176","https://openalex.org/W2963536419","https://openalex.org/W2963699792","https://openalex.org/W2963849369","https://openalex.org/W2964016027","https://openalex.org/W2964199361","https://openalex.org/W2964225075","https://openalex.org/W2964241181","https://openalex.org/W2967045987","https://openalex.org/W2970583209","https://openalex.org/W2982147439","https://openalex.org/W2982232158","https://openalex.org/W2984933298","https://openalex.org/W2986953233","https://openalex.org/W2987391422","https://openalex.org/W2988916019","https://openalex.org/W2990599624","https://openalex.org/W2998296459","https://openalex.org/W3004349648","https://openalex.org/W3009224666","https://openalex.org/W3009811369","https://openalex.org/W3021357623","https://openalex.org/W3034230284","https://openalex.org/W3034563158","https://openalex.org/W3034951775","https://openalex.org/W3035180180","https://openalex.org/W3035440494","https://openalex.org/W3035598501","https://openalex.org/W3097096317","https://openalex.org/W3117097536","https://openalex.org/W3173957243","https://openalex.org/W4293651439","https://openalex.org/W4297733535","https://openalex.org/W4299522971","https://openalex.org/W4301141993","https://openalex.org/W6620707391","https://openalex.org/W6632922691","https://openalex.org/W6639102338","https://openalex.org/W6679687845","https://openalex.org/W6680285999","https://openalex.org/W6683323873","https://openalex.org/W6690815549","https://openalex.org/W6736685754","https://openalex.org/W6744557953","https://openalex.org/W6745537798","https://openalex.org/W6746746423","https://openalex.org/W6748822025","https://openalex.org/W6754152559","https://openalex.org/W6764644601","https://openalex.org/W6776491375","https://openalex.org/W6787166195"],"related_works":["https://openalex.org/W4353114450","https://openalex.org/W4387735881","https://openalex.org/W4387735893","https://openalex.org/W2963343840","https://openalex.org/W3131914241","https://openalex.org/W2754155766","https://openalex.org/W4287854977","https://openalex.org/W2769151336","https://openalex.org/W2963192850","https://openalex.org/W3195149243"],"abstract_inverted_index":{"This":[0],"paper":[1],"addresses":[2],"the":[3,15,22,60,70,194],"task":[4],"of":[5,21,59,186],"detecting":[6],"and":[7,18,49,100,126,140,146,152,204,221],"recognizing":[8],"human-object":[9],"interactions":[10],"(HOI)":[11],"in":[12,69,193,197],"images.":[13],"Considering":[14],"intrinsic":[16],"complexity":[17],"structural":[19],"nature":[20],"task,":[23],"we":[24,163],"introduce":[25],"a":[26,32,53,86,112,122,160,176],"cascaded":[27],"parsing":[28,88,143],"network":[29,90],"(CP-HOI)":[30],"for":[31,104],"multi-stage,":[33],"structured":[34,54,79],"HOI":[35,47,96,119,144,148,216],"understanding.":[36,107],"At":[37],"each":[38],"cascade":[39],"stage,":[40,72],"an":[41,133],"instance":[42,151],"detection":[43,158,203],"module":[44,82],"progressively":[45],"refines":[46],"proposals":[48],"feeds":[50],"them":[51],"into":[52,179],"interaction":[55,80],"reasoning":[56,81,147],"module.":[57],"Each":[58],"two":[61,214],"modules":[62],"is":[63,83],"also":[64],"connected":[65],"to":[66,168],"its":[67],"predecessor":[68],"previous":[71],"enabling":[73],"efficient":[74],"cross-stage":[75],"information":[76],"propagation.":[77],"The":[78],"built":[84],"upon":[85],"graph":[87,114],"neural":[89],"(GPNN),":[91],"which":[92],"efficiently":[93],"models":[94],"potential":[95],"structures":[97,120,145],"as":[98],"graphs":[99],"mines":[101],"rich":[102],"context":[103],"comprehensive":[105],"relation":[106,153,157,172,181,202],"In":[108,206],"particular,":[109],"GPNN":[110,137],"infers":[111],"parse":[113],"that":[115],"i)":[116],"interprets":[117],"meaningful":[118],"by":[121],"learnable":[123],"adjacency":[124],"matrix,":[125],"ii)":[127],"predicts":[128],"action":[129],"(edge)":[130],"labels.":[131],"Within":[132],"end-to-end,":[134],"message-passing":[135],"framework,":[136],"blends":[138],"learning":[139],"inference,":[141],"iteratively":[142],"representations":[149],"(i.e.,":[150],"features).":[154],"Further":[155],"beyond":[156],"at":[159],"bounding-box":[161],"level,":[162],"make":[164],"our":[165,187,208],"framework":[166],"flexible":[167],"perform":[169],"fine-grained":[170],"pixel-wise":[171],"segmentation;":[173],"this":[174],"provides":[175],"new":[177],"glimpse":[178],"better":[180],"modeling.":[182],"A":[183],"preliminary":[184],"version":[185],"CP-HOI":[188,209],"model":[189],"reached":[190],"1<sup>st</sup>":[191],"place":[192],"ICCV2019":[195],"Person":[196],"Context":[198],"Challenge,":[199],"on":[200,213],"both":[201],"segmentation.":[205],"addition,":[207],"shows":[210],"promising":[211],"results":[212],"popular":[215],"recognition":[217],"benchmarks,":[218],"i.e.,":[219],"V-COCO":[220],"HICO-DET.":[222]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":15},{"year":2024,"cited_by_count":16},{"year":2023,"cited_by_count":24},{"year":2022,"cited_by_count":32},{"year":2021,"cited_by_count":30}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
