{"id":"https://openalex.org/W4388190284","doi":"https://doi.org/10.1145/3581783.3612283","title":"Hi-SIGIR: Hierachical Semantic-Guided Image-to-image Retrieval via Scene Graph","display_name":"Hi-SIGIR: Hierachical Semantic-Guided Image-to-image Retrieval via Scene Graph","publication_year":2023,"publication_date":"2023-10-26","ids":{"openalex":"https://openalex.org/W4388190284","doi":"https://doi.org/10.1145/3581783.3612283"},"language":"en","primary_location":{"id":"doi:10.1145/3581783.3612283","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581783.3612283","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043749691","display_name":"Yulu Wang","orcid":"https://orcid.org/0009-0009-9854-4885"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yulu Wang","raw_affiliation_strings":["Chinese Academy of Sciences &amp; University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0009-9854-4885","affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences &amp; University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070078619","display_name":"Pengwen Dai","orcid":null},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengwen Dai","raw_affiliation_strings":["Sun Yat-sen University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-6262-982X","affiliations":[{"raw_affiliation_string":"Sun Yat-sen University, Shenzhen, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084784341","display_name":"Xiaojun Jia","orcid":"https://orcid.org/0000-0002-2018-9344"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaojun Jia","raw_affiliation_strings":["Chinese Academy of Sciences &amp; University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-2018-9344","affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences &amp; University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101855535","display_name":"Zhitao Zeng","orcid":"https://orcid.org/0000-0001-9716-5626"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhitao Zeng","raw_affiliation_strings":["Chinese Academy of Sciences &amp; University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-9716-5626","affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences &amp; University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102939956","display_name":"Rui Li","orcid":"https://orcid.org/0009-0006-4847-2324"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rui Li","raw_affiliation_strings":["Chinese Academy of Sciences &amp; University of Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0006-4847-2324","affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences &amp; University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5068837264","display_name":"Xiaochun Cao","orcid":"https://orcid.org/0000-0001-7141-708X"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaochun Cao","raw_affiliation_strings":["Sun Yat-sen University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-7141-708X","affiliations":[{"raw_affiliation_string":"Sun Yat-sen University, Shenzhen, China","institution_ids":["https://openalex.org/I157773358"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5043749691"],"corresponding_institution_ids":["https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.471,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.65554279,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"6400","last_page":"6409"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.848192572593689},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.6711521744728088},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6059356927871704},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5384663343429565},{"id":"https://openalex.org/keywords/visual-word","display_name":"Visual Word","score":0.5232309699058533},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5176480412483215},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5119229555130005},{"id":"https://openalex.org/keywords/scene-graph","display_name":"Scene graph","score":0.47944679856300354},{"id":"https://openalex.org/keywords/automatic-image-annotation","display_name":"Automatic image annotation","score":0.4688250720500946},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.46087533235549927},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.45893049240112305},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.40575453639030457},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.33494603633880615},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.15996605157852173}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.848192572593689},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.6711521744728088},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6059356927871704},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5384663343429565},{"id":"https://openalex.org/C189391414","wikidata":"https://www.wikidata.org/wiki/Q7936579","display_name":"Visual Word","level":4,"score":0.5232309699058533},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5176480412483215},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5119229555130005},{"id":"https://openalex.org/C179372163","wikidata":"https://www.wikidata.org/wiki/Q1406181","display_name":"Scene graph","level":3,"score":0.47944679856300354},{"id":"https://openalex.org/C199579030","wikidata":"https://www.wikidata.org/wiki/Q2851778","display_name":"Automatic image annotation","level":4,"score":0.4688250720500946},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.46087533235549927},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.45893049240112305},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.40575453639030457},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.33494603633880615},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.15996605157852173},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3581783.3612283","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3581783.3612283","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W1536680647","https://openalex.org/W1677409904","https://openalex.org/W1773149199","https://openalex.org/W1861492603","https://openalex.org/W2008857988","https://openalex.org/W2044465660","https://openalex.org/W2059186503","https://openalex.org/W2061283430","https://openalex.org/W2071027807","https://openalex.org/W2077069816","https://openalex.org/W2108598243","https://openalex.org/W2113180829","https://openalex.org/W2125148312","https://openalex.org/W2141362318","https://openalex.org/W2141584146","https://openalex.org/W2148809531","https://openalex.org/W2151103935","https://openalex.org/W2170282673","https://openalex.org/W2194775991","https://openalex.org/W2250539671","https://openalex.org/W2340690086","https://openalex.org/W2535410496","https://openalex.org/W2544587078","https://openalex.org/W2744926832","https://openalex.org/W2752160731","https://openalex.org/W2914885528","https://openalex.org/W2921526458","https://openalex.org/W2925177113","https://openalex.org/W2951019013","https://openalex.org/W2963125676","https://openalex.org/W2963536419","https://openalex.org/W2964157791","https://openalex.org/W2989952597","https://openalex.org/W3010277541","https://openalex.org/W3034302278","https://openalex.org/W3035575176","https://openalex.org/W3096651815","https://openalex.org/W3103523530","https://openalex.org/W3105655001","https://openalex.org/W3107530881","https://openalex.org/W3108274592","https://openalex.org/W3115656231","https://openalex.org/W3136405090","https://openalex.org/W3158091578","https://openalex.org/W3169253336","https://openalex.org/W4226239489","https://openalex.org/W4285412155","https://openalex.org/W4287367114","https://openalex.org/W4312229863","https://openalex.org/W4312959179"],"related_works":["https://openalex.org/W2387268739","https://openalex.org/W2123147980","https://openalex.org/W2168037874","https://openalex.org/W2066590080","https://openalex.org/W2076842684","https://openalex.org/W2918350319","https://openalex.org/W1539573266","https://openalex.org/W4387423606","https://openalex.org/W2513891871","https://openalex.org/W2187873862"],"abstract_inverted_index":{"Image-to-image":[0],"retrieval,":[1],"a":[2,12,45,107,202,208],"fundamental":[3],"task,":[4],"aims":[5],"at":[6,188],"matching":[7],"similar":[8],"images":[9,38,185],"based":[10],"on":[11,218],"query":[13],"image.":[14,132],"Existing":[15],"methods":[16],"with":[17,39],"convolutional":[18],"neural":[19,168],"networks":[20],"are":[21,88,157],"usually":[22],"sensitive":[23],"to":[24,55,76,120,159,165,170,195,211],"low-level":[25],"visual":[26,71,141],"features,":[27],"and":[28,42,64,137,142,148,163,192],"ignore":[29,68],"high-level":[30],"semantic":[31,59,143],"relationship":[32],"information.":[33,173],"This":[34],"makes":[35],"retrieving":[36],"complicated":[37],"multiple":[40],"objects":[41,63],"various":[43],"relationships":[44],"significant":[46],"challenge.":[47],"Although":[48],"some":[49],"works":[50],"introduce":[51,201],"the":[52,57,62,69,77,92,95,127,140,146,151,166,177,180,190,223,226],"scene":[53,115,128,152,181],"graph":[54,129,167],"capture":[56],"global":[58,172,193],"features":[60,144,156],"of":[61,79,94,130,145,183,225],"their":[65],"relations,":[66],"they":[67],"local":[70,161,191],"representations.":[72],"In":[73],"addition,":[74],"due":[75],"fragility":[78],"individual":[80],"modal":[81],"representations,":[82],"poisoning":[83],"attacks":[84],"in":[85,207],"adversarial":[86],"scenarios":[87],"easily":[89],"achieved,":[90],"hurting":[91],"robustness":[93],"visual-guided":[96],"foundation":[97],"image":[98,197,213],"retrieval":[99,112],"model.":[100],"To":[101],"overcome":[102],"these":[103,155,175],"issues,":[104],"we":[105,200],"propose":[106],"novel":[108],"hierarchical":[109],"semantic-guided":[110],"image-to-image":[111],"method":[113,125],"via":[114],"graph,":[116],"called":[117],"Hi-SIGIR.":[118],"Specifically,":[119],"begin":[121],"with,":[122],"our":[123,134],"proposed":[124,227],"generates":[126],"an":[131],"Then,":[133],"model":[135],"extracts":[136],"learns":[138],"both":[139,189],"nodes":[147],"relations":[149],"within":[150],"graphs.":[153],"Next,":[154],"fused":[158],"obtain":[160,171],"information":[162],"sent":[164],"network":[169],"Using":[174],"information,":[176],"similarity":[178],"between":[179],"graphs":[182],"several":[184,219],"is":[186],"calculated":[187],"levels":[194],"perform":[196],"retrieval.":[198],"Finally,":[199],"surrogate":[203],"that":[204],"calculates":[205],"relevance":[206],"cross-modal":[209],"manner":[210],"understand":[212],"content":[214],"better.":[215],"Experimental":[216],"evaluations":[217],"wildly-used":[220],"benchmarks":[221],"demonstrate":[222],"superiority":[224],"method.":[228]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
