{"id":"https://openalex.org/W2981660636","doi":"https://doi.org/10.1145/3343031.3350921","title":"Hierarchical Visual Relationship Detection","display_name":"Hierarchical Visual Relationship Detection","publication_year":2019,"publication_date":"2019-10-15","ids":{"openalex":"https://openalex.org/W2981660636","doi":"https://doi.org/10.1145/3343031.3350921","mag":"2981660636"},"language":"en","primary_location":{"id":"doi:10.1145/3343031.3350921","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3343031.3350921","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101441137","display_name":"Xu Sun","orcid":"https://orcid.org/0000-0001-8241-9320"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xu Sun","raw_affiliation_strings":["Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070294325","display_name":"Yuan Zi","orcid":"https://orcid.org/0000-0002-4723-538X"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuan Zi","raw_affiliation_strings":["Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084591510","display_name":"Tongwei Ren","orcid":"https://orcid.org/0000-0003-3092-424X"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tongwei Ren","raw_affiliation_strings":["Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035112538","display_name":"Jinhui Tang","orcid":"https://orcid.org/0000-0001-9008-222X"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinhui Tang","raw_affiliation_strings":["Nanjing University of Science and Technology, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101546753","display_name":"Gangshan Wu","orcid":"https://orcid.org/0000-0003-1391-1762"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gangshan Wu","raw_affiliation_strings":["Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101441137"],"corresponding_institution_ids":["https://openalex.org/I881766915"],"apc_list":null,"apc_paid":null,"fwci":0.5061,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.69711684,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"94","last_page":"102"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.714601993560791},{"id":"https://openalex.org/keywords/predicate","display_name":"Predicate (mathematical logic)","score":0.7072783708572388},{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.6523807048797607},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6130653023719788},{"id":"https://openalex.org/keywords/hierarchy","display_name":"Hierarchy","score":0.518444299697876},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5117368698120117},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.463419109582901},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3406524658203125}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.714601993560791},{"id":"https://openalex.org/C140146324","wikidata":"https://www.wikidata.org/wiki/Q1144319","display_name":"Predicate (mathematical logic)","level":2,"score":0.7072783708572388},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.6523807048797607},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6130653023719788},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.518444299697876},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5117368698120117},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.463419109582901},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3406524658203125},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C34447519","wikidata":"https://www.wikidata.org/wiki/Q179522","display_name":"Market economy","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3343031.3350921","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3343031.3350921","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7599999904632568,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W64813323","https://openalex.org/W639708223","https://openalex.org/W1498158520","https://openalex.org/W1536680647","https://openalex.org/W1933349210","https://openalex.org/W1959000896","https://openalex.org/W1974907760","https://openalex.org/W2049705550","https://openalex.org/W2081580037","https://openalex.org/W2089060621","https://openalex.org/W2105101328","https://openalex.org/W2108598243","https://openalex.org/W2135166986","https://openalex.org/W2143017621","https://openalex.org/W2157065343","https://openalex.org/W2277195237","https://openalex.org/W2340690086","https://openalex.org/W2479423890","https://openalex.org/W2525579820","https://openalex.org/W2556388456","https://openalex.org/W2570343428","https://openalex.org/W2579549467","https://openalex.org/W2591644541","https://openalex.org/W2604254608","https://openalex.org/W2607855566","https://openalex.org/W2765137706","https://openalex.org/W2777602943","https://openalex.org/W2788537604","https://openalex.org/W2789177853","https://openalex.org/W2799029629","https://openalex.org/W2883170015","https://openalex.org/W2886970679","https://openalex.org/W2887029921","https://openalex.org/W2889811054","https://openalex.org/W2890531016","https://openalex.org/W2936758701","https://openalex.org/W2950133940","https://openalex.org/W2950577311","https://openalex.org/W2962737704","https://openalex.org/W2963536419","https://openalex.org/W2963649796","https://openalex.org/W2963650529","https://openalex.org/W2963980128","https://openalex.org/W3005285208","https://openalex.org/W4252959399"],"related_works":["https://openalex.org/W2353179089","https://openalex.org/W2923538289","https://openalex.org/W2353125546","https://openalex.org/W2470643824","https://openalex.org/W2349635380","https://openalex.org/W4353089801","https://openalex.org/W2353819554","https://openalex.org/W2359488321","https://openalex.org/W2389866386","https://openalex.org/W2131379912"],"abstract_inverted_index":{"Acting":[0],"as":[1],"a":[2,56,104],"bridge":[3],"between":[4],"vision":[5],"and":[6,16,112,130,147,157],"language,":[7],"visual":[8,62,122],"relationship":[9,24,39,63,73,152],"detection":[10,64,111],"(VRD)":[11],"aims":[12],"to":[13,160,173],"represent":[14],"objects":[15],"their":[17],"interactions":[18],"in":[19,42,97],"an":[20],"image":[21,48,82],"with":[22,69,134],"several":[23],"triplets.":[25],"Nevertheless,":[26],"the":[27,35,76,80,91,120,140,151,174],"conventional":[28],"VRD":[29,58,156],"task":[30,59],"shows":[31],"little":[32],"consideration":[33],"for":[34,47,143],"penalization":[36],"of":[37,79,94,108,155],"incorrect":[38],"predictions,":[40],"which":[41,66],"turn":[43],"undermines":[44],"its":[45],"support":[46],"understanding":[49],"applications.":[50],"In":[51],"this":[52],"paper,":[53],"we":[54,102],"propose":[55,103,139],"novel":[57],"named":[60],"hierarchical":[61,109,113,121,161],"(HVRD),":[65],"encourages":[67],"predictions":[68],"abstract":[70],"yet":[71],"compatible":[72],"triplets":[74],"when":[75],"confidence":[77],"level":[78],"specific":[81],"content":[83],"is":[84,171],"relatively":[85],"low.":[86],"Meanwhile,":[87],"HVRD":[88,105,144],"can":[89,117],"handle":[90],"inevitable":[92],"ambiguity":[93],"groundtruth":[95],"annotation":[96],"VRD.":[98],"Based":[99],"on":[100],"this,":[101],"method,":[106],"consisting":[107],"object":[110,127],"predicate":[114,131],"detection.":[115],"It":[116],"effectively":[118],"detect":[119],"relationships":[123],"by":[124,149],"exploiting":[125],"both":[126],"concept":[128,132],"hierarchy":[129,133],"order":[135],"embedding.":[136],"We":[137],"also":[138],"first":[141],"datasets":[142,159],"evaluation,":[145],"H-VRD":[146],"H-VG,":[148],"expanding":[150],"category":[153],"spaces":[154],"VG":[158],"ones":[162],"respectively.":[163],"The":[164],"experimental":[165],"results":[166],"show":[167],"that":[168],"our":[169],"method":[170],"superior":[172],"state-of-the-art":[175],"baselines.":[176]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
