{"id":"https://openalex.org/W3210192352","doi":"https://doi.org/10.1145/3475731.3484957","title":"Hierarchical Semantic Enhanced Directional Graph Network for Visual Commonsense Reasoning","display_name":"Hierarchical Semantic Enhanced Directional Graph Network for Visual Commonsense Reasoning","publication_year":2021,"publication_date":"2021-10-22","ids":{"openalex":"https://openalex.org/W3210192352","doi":"https://doi.org/10.1145/3475731.3484957","mag":"3210192352"},"language":"en","primary_location":{"id":"doi:10.1145/3475731.3484957","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3475731.3484957","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st International Workshop on Trustworthy AI for Multimedia Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070523720","display_name":"Mingyan Wu","orcid":"https://orcid.org/0000-0003-2610-285X"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Mingyan Wu","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050911130","display_name":"Shuhan Qi","orcid":"https://orcid.org/0000-0002-6903-145X"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuhan Qi","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen &amp; PengCheng Laboratory, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen &amp; PengCheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793","https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053687590","display_name":"Jun Rao","orcid":"https://orcid.org/0000-0001-5804-1508"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Rao","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100417632","display_name":"Jiajia Zhang","orcid":"https://orcid.org/0000-0001-6611-2046"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiajia Zhang","raw_affiliation_strings":["Harbin Institute of Technology, ShenZhen, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, ShenZhen, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069241620","display_name":"Qing Liao","orcid":"https://orcid.org/0000-0003-1012-5301"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qing Liao","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113968141","display_name":"Xuan Wang","orcid":"https://orcid.org/0009-0005-4952-4619"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuan Wang","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102924671","display_name":"Xinxin Liao","orcid":"https://orcid.org/0000-0002-5761-7832"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinxin Liao","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5070523720"],"corresponding_institution_ids":["https://openalex.org/I204983213"],"apc_list":null,"apc_paid":null,"fwci":0.0961,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.41013072,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"2","issue":null,"first_page":"27","last_page":"36"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.8433955907821655},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7737899422645569},{"id":"https://openalex.org/keywords/commonsense-reasoning","display_name":"Commonsense reasoning","score":0.7663213014602661},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6391736268997192},{"id":"https://openalex.org/keywords/commonsense-knowledge","display_name":"Commonsense knowledge","score":0.6231101751327515},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5832207202911377},{"id":"https://openalex.org/keywords/visual-reasoning","display_name":"Visual reasoning","score":0.5472722053527832},{"id":"https://openalex.org/keywords/phrase","display_name":"Phrase","score":0.5116634368896484},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.49310705065727234},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3478120267391205},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.2098451554775238},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.13961070775985718}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.8433955907821655},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7737899422645569},{"id":"https://openalex.org/C193221554","wikidata":"https://www.wikidata.org/wiki/Q5153664","display_name":"Commonsense reasoning","level":2,"score":0.7663213014602661},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6391736268997192},{"id":"https://openalex.org/C30542707","wikidata":"https://www.wikidata.org/wiki/Q1603203","display_name":"Commonsense knowledge","level":3,"score":0.6231101751327515},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5832207202911377},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.5472722053527832},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.5116634368896484},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.49310705065727234},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3478120267391205},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.2098451554775238},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.13961070775985718}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3475731.3484957","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3475731.3484957","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st International Workshop on Trustworthy AI for Multimedia Computing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1152794872","display_name":null,"funder_award_id":"No.2020A1515010652","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G8932516491","display_name":null,"funder_award_id":"No.61902093","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321921","display_name":"Natural Science Foundation of Guangdong Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1501856433","https://openalex.org/W1905882502","https://openalex.org/W1933349210","https://openalex.org/W2116341502","https://openalex.org/W2186222003","https://openalex.org/W2194775991","https://openalex.org/W2277195237","https://openalex.org/W2464305746","https://openalex.org/W2608787653","https://openalex.org/W2745461083","https://openalex.org/W2810482788","https://openalex.org/W2894786240","https://openalex.org/W2904458925","https://openalex.org/W2949831469","https://openalex.org/W2950761309","https://openalex.org/W2962964995","https://openalex.org/W2963115613","https://openalex.org/W2963150162","https://openalex.org/W2963176022","https://openalex.org/W2963318290","https://openalex.org/W2963341956","https://openalex.org/W2963383024","https://openalex.org/W2963925437","https://openalex.org/W2963977738","https://openalex.org/W2966146145","https://openalex.org/W2970927600","https://openalex.org/W3099023595","https://openalex.org/W3118694826","https://openalex.org/W4211225923","https://openalex.org/W4236965008","https://openalex.org/W4301409532"],"related_works":["https://openalex.org/W3035583586","https://openalex.org/W4320165839","https://openalex.org/W2151799802","https://openalex.org/W2196562041","https://openalex.org/W4385488510","https://openalex.org/W2073302931","https://openalex.org/W3021007069","https://openalex.org/W2981750021","https://openalex.org/W4302773889","https://openalex.org/W4398163702"],"abstract_inverted_index":{"Visual":[0],"commonsense":[1,35],"reasoning":[2,137,151,166],"(VCR)":[3],"task":[4],"aims":[5],"at":[6],"boosting":[7],"research":[8],"of":[9,20,23,157,179],"cognition-level":[10],"correlations":[11],"reasoning.":[12,93],"It":[13],"requires":[14],"not":[15],"only":[16],"a":[17,99,113,133,163],"thorough":[18],"understanding":[19],"correlated":[21],"details":[22],"the":[24,28,40,45,55,126,155,176,180,189],"scene":[25],"but":[26],"also":[27],"ability":[29],"to":[30,43,74,90,154,162,174],"infer":[31],"correlation":[32],"with":[33,86,206],"related":[34],"knowledge.":[36],"Existing":[37],"approaches":[38],"consider":[39],"region-word":[41],"affinity":[42],"perform":[44],"semantic":[46,102],"alignment":[47,123],"between":[48],"vision":[49],"and":[50,61,66,202],"linguistic":[51,67],"domains,":[52],"which":[53,119,193],"neglect":[54],"implicit":[56],"correspondence":[57],"(e.g.":[58],"word-scene,":[59],"region-phrase,":[60],"phrase-scene)":[62],"among":[63],"visual":[64],"concepts":[65],"words.":[68],"Although":[69],"efforts":[70],"have":[71,185],"been":[72,186],"made":[73],"deliver":[75],"promising":[76],"results":[77,201],"in":[78,149],"previous":[79],"work,":[80],"these":[81,158],"methods":[82],"are":[83],"still":[84],"confronted":[85],"challenges":[87],"when":[88],"comes":[89],"make":[91],"interpretable":[92,165],"Toward":[94],"this":[95,141],"end,":[96],"we":[97,111,131],"present":[98],"novel":[100],"hierarchical":[101,127],"enhanced":[103],"directional":[104],"graph":[105,136,170],"network.":[106],"To":[107],"be":[108,146],"more":[109,164],"specific,":[110],"design":[112],"Modality":[114],"Interaction":[115],"Unit":[116],"(MIU)":[117],"module,":[118,142],"captures":[120],"high-order":[121],"cross-modal":[122],"by":[124],"aggregating":[125],"vision-language":[128],"relationships.":[129],"Afterward,":[130],"propose":[132],"direction":[134],"clue-aware":[135],"(DCGR)":[138],"module.":[139],"In":[140],"valuable":[143],"entities":[144],"can":[145,198],"dynamically":[147],"selected":[148],"each":[150],"step,":[152],"according":[153],"importance":[156],"entities.":[159],"This":[160],"leads":[161],"procedure.":[167],"Ultimately,":[168],"heterogeneous":[169],"attention":[171],"is":[172],"introduced":[173],"filter":[175],"irrelevant":[177],"parts":[178],"final":[181],"answers.":[182],"Extensive":[183],"experiments":[184],"conducted":[187],"on":[188],"VCR":[190],"benchmark":[191],"dataset,":[192],"demonstrates":[194],"that":[195],"our":[196],"method":[197],"achieve":[199],"competitive":[200],"better":[203],"interpretability":[204],"compared":[205],"several":[207],"state-of-the-art":[208],"baselines.":[209]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
