{"id":"https://openalex.org/W3189076762","doi":"https://doi.org/10.1109/tmm.2021.3104411","title":"Relation-Aware Compositional Zero-Shot Learning for Attribute-Object Pair Recognition","display_name":"Relation-Aware Compositional Zero-Shot Learning for Attribute-Object Pair Recognition","publication_year":2021,"publication_date":"2021-08-13","ids":{"openalex":"https://openalex.org/W3189076762","doi":"https://doi.org/10.1109/tmm.2021.3104411","mag":"3189076762"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2021.3104411","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2021.3104411","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2108.04603","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Ziwei Xu","orcid":"https://orcid.org/0000-0003-0600-2579"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Ziwei Xu","raw_affiliation_strings":["School of Computing, National University of Singapore, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0003-0600-2579","affiliations":[{"raw_affiliation_string":"School of Computing, National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Guangzhi Wang","orcid":"https://orcid.org/0000-0002-5036-4051"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Guangzhi Wang","raw_affiliation_strings":["NUS Graduate School for Integrative Sciences &amp; Engineering, National University of Singapore, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-5036-4051","affiliations":[{"raw_affiliation_string":"NUS Graduate School for Integrative Sciences &amp; Engineering, National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yongkang Wong","orcid":"https://orcid.org/0000-0002-1239-4428"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yongkang Wong","raw_affiliation_strings":["School of Computing, National University of Singapore, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-1239-4428","affiliations":[{"raw_affiliation_string":"School of Computing, National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":null,"display_name":"Mohan S. Kankanhalli","orcid":"https://orcid.org/0000-0002-4846-2015"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Mohan S. Kankanhalli","raw_affiliation_strings":["School of Computing, National University of Singapore, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-4846-2015","affiliations":[{"raw_affiliation_string":"School of Computing, National University of Singapore, Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I165932596"],"apc_list":null,"apc_paid":null,"fwci":1.6798,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.8701276,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"24","issue":null,"first_page":"3652","last_page":"3664"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9319999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9319999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.01209999993443489,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.009499999694526196,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5626000165939331},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.4293000102043152},{"id":"https://openalex.org/keywords/blocking","display_name":"Blocking (statistics)","score":0.4291999936103821},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.40700000524520874},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.382999986410141},{"id":"https://openalex.org/keywords/message-passing","display_name":"Message passing","score":0.3806999921798706},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.3628999888896942},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.3425000011920929},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.31189998984336853}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8745999932289124},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5626000165939331},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5273000001907349},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.4293000102043152},{"id":"https://openalex.org/C144745244","wikidata":"https://www.wikidata.org/wiki/Q4927286","display_name":"Blocking (statistics)","level":2,"score":0.4291999936103821},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.40700000524520874},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.382999986410141},{"id":"https://openalex.org/C854659","wikidata":"https://www.wikidata.org/wiki/Q1859284","display_name":"Message passing","level":2,"score":0.3806999921798706},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.3628999888896942},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3476000130176544},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3425000011920929},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.31189998984336853},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.30070000886917114},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.2922999858856201},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.29100000858306885},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.28999999165534973},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.28630000352859497},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.28459998965263367},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2687000036239624},{"id":"https://openalex.org/C2993807640","wikidata":"https://www.wikidata.org/wiki/Q103709453","display_name":"Attention network","level":2,"score":0.26579999923706055},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.26269999146461487},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.25870001316070557},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.25769999623298645},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.2526000142097473}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tmm.2021.3104411","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2021.3104411","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2108.04603","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2108.04603","pdf_url":"https://arxiv.org/pdf/2108.04603","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2108.04603","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2108.04603","pdf_url":"https://arxiv.org/pdf/2108.04603","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320709","display_name":"National Research Foundation Singapore","ror":"https://ror.org/03cpyc314"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":83,"referenced_works":["https://openalex.org/W64813323","https://openalex.org/W841113906","https://openalex.org/W1948251820","https://openalex.org/W1967053063","https://openalex.org/W1969616664","https://openalex.org/W2049705550","https://openalex.org/W2050964073","https://openalex.org/W2052530028","https://openalex.org/W2063386797","https://openalex.org/W2064851185","https://openalex.org/W2093848332","https://openalex.org/W2098411764","https://openalex.org/W2105482032","https://openalex.org/W2106833577","https://openalex.org/W2109317801","https://openalex.org/W2123695991","https://openalex.org/W2157423479","https://openalex.org/W2181378550","https://openalex.org/W2194775991","https://openalex.org/W2250539671","https://openalex.org/W2270070752","https://openalex.org/W2289084343","https://openalex.org/W2289324734","https://openalex.org/W2294130536","https://openalex.org/W2346746376","https://openalex.org/W2400717490","https://openalex.org/W2413794162","https://openalex.org/W2441043183","https://openalex.org/W2464503653","https://openalex.org/W2508457857","https://openalex.org/W2594270457","https://openalex.org/W2611406568","https://openalex.org/W2611632661","https://openalex.org/W2724492314","https://openalex.org/W2736809457","https://openalex.org/W2740982616","https://openalex.org/W2777926144","https://openalex.org/W2888096830","https://openalex.org/W2889167066","https://openalex.org/W2904378456","https://openalex.org/W2905449860","https://openalex.org/W2924476266","https://openalex.org/W2955882737","https://openalex.org/W2963149653","https://openalex.org/W2963431581","https://openalex.org/W2963448850","https://openalex.org/W2963486920","https://openalex.org/W2963499153","https://openalex.org/W2963955422","https://openalex.org/W2963960318","https://openalex.org/W2963989815","https://openalex.org/W2967045987","https://openalex.org/W2976669726","https://openalex.org/W2976818183","https://openalex.org/W2981648435","https://openalex.org/W2981774933","https://openalex.org/W2981963155","https://openalex.org/W2982863468","https://openalex.org/W2986385672","https://openalex.org/W2987391422","https://openalex.org/W2991813857","https://openalex.org/W3004319625","https://openalex.org/W3014225712","https://openalex.org/W3025689158","https://openalex.org/W3034727271","https://openalex.org/W3035084814","https://openalex.org/W3035655772","https://openalex.org/W3092962760","https://openalex.org/W3096741441","https://openalex.org/W3097309192","https://openalex.org/W3114005958","https://openalex.org/W3119381934","https://openalex.org/W3143107425","https://openalex.org/W6638318767","https://openalex.org/W6640036494","https://openalex.org/W6640963894","https://openalex.org/W6714181750","https://openalex.org/W6739901393","https://openalex.org/W6755207826","https://openalex.org/W6765549164","https://openalex.org/W6766904570","https://openalex.org/W6769311773","https://openalex.org/W6780184713"],"related_works":[],"abstract_inverted_index":{"This":[0],"paper":[1],"proposes":[2],"a":[3,132],"novel":[4],"model":[5,21,64,114,142],"for":[6,14,45,76,86,143],"recognizing":[7],"images":[8],"with":[9],"composite":[10,15,120],"attribute-object":[11,50],"concepts,":[12,78],"notably":[13],"concepts":[16,47,121],"that":[17,48,135],"are":[18],"unseen":[19,147],"during":[20],"training.":[22],"We":[23],"aim":[24],"to":[25,103,111,140],"explore":[26],"the":[27,33,57,80,100,105,113,124,137,141,158,161],"three":[28],"key":[29],"properties":[30],"required":[31],"by":[32],"task":[34],"&#x2014;":[35],"relation-aware,":[36],"consistent,":[37],"and":[38,42,88,122,128,146,151],"decoupled&#x2014;to":[39],"learn":[40],"rich":[41],"robust":[43],"features":[44,75,85],"primitive":[46,77,108],"compose":[49],"pairs.":[51],"To":[52],"this":[53],"end,":[54],"we":[55,130],"propose":[56,131],"Blocked":[58],"Message":[59],"Passing":[60],"Network":[61],"(BMP-Net).":[62],"The":[63,69],"consists":[65],"of":[66,160],"two":[67,155],"modules.":[68],"concept":[70,101],"module":[71,82,102],"generates":[72],"semantically":[73],"meaningful":[74],"whereas":[79],"visual":[81,84],"extracts":[83],"attributes":[87,127],"objects":[89],"from":[90,115],"input":[91],"images.":[92],"A":[93],"message":[94],"passing":[95],"mechanism":[96,134],"is":[97],"used":[98],"in":[99],"capture":[104],"relations":[106],"between":[107,126],"concepts.":[109,148],"Furthermore,":[110],"prevent":[112],"being":[116],"biased":[117],"towards":[118],"seen":[119,145],"reduce":[123],"entanglement":[125],"objects,":[129],"blocking":[133],"equalizes":[136],"information":[138],"available":[139],"both":[144],"Extensive":[149],"experiments":[150],"ablation":[152],"studies":[153],"on":[154],"benchmarks":[156],"show":[157],"efficacy":[159],"proposed":[162],"model.":[163]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2021-08-16T00:00:00"}
