{"id":"https://openalex.org/W4384641262","doi":"https://doi.org/10.1145/3539618.3591705","title":"Keyword-Based Diverse Image Retrieval by Semantics-aware Contrastive Learning and Transformer","display_name":"Keyword-Based Diverse Image Retrieval by Semantics-aware Contrastive Learning and Transformer","publication_year":2023,"publication_date":"2023-07-18","ids":{"openalex":"https://openalex.org/W4384641262","doi":"https://doi.org/10.1145/3539618.3591705"},"language":"en","primary_location":{"id":"doi:10.1145/3539618.3591705","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3539618.3591705","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 46th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045420812","display_name":"Minyi Zhao","orcid":"https://orcid.org/0000-0001-7720-806X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Minyi Zhao","raw_affiliation_strings":["Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100376316","display_name":"Jinpeng Wang","orcid":"https://orcid.org/0000-0002-4352-4897"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinpeng Wang","raw_affiliation_strings":["Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053595500","display_name":"Dongliang Liao","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongliang Liao","raw_affiliation_strings":["Tencent Inc., Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"Tencent Inc., Guangzhou, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100319145","display_name":"Yiru Wang","orcid":"https://orcid.org/0009-0006-2193-6686"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yiru Wang","raw_affiliation_strings":["Tencent Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tencent Inc., Beijing, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082530668","display_name":"Huanzhong Duan","orcid":"https://orcid.org/0009-0000-7815-6142"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huanzhong Duan","raw_affiliation_strings":["Tencent Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tencent Inc., Beijing, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017862559","display_name":"Shuigeng Zhou","orcid":"https://orcid.org/0000-0002-1949-2768"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuigeng Zhou","raw_affiliation_strings":["Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5045420812"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":0.3611,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.58956219,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1262","last_page":"1272"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7777012586593628},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.7159229516983032},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5606896281242371},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5578643679618835},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5291149020195007},{"id":"https://openalex.org/keywords/relevance-feedback","display_name":"Relevance feedback","score":0.47860878705978394},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.4609461724758148},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.46040213108062744},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.4574306607246399},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3671247065067291},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.18991619348526}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7777012586593628},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.7159229516983032},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5606896281242371},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5578643679618835},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5291149020195007},{"id":"https://openalex.org/C2779532271","wikidata":"https://www.wikidata.org/wiki/Q445558","display_name":"Relevance feedback","level":4,"score":0.47860878705978394},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.4609461724758148},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.46040213108062744},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.4574306607246399},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3671247065067291},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.18991619348526},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3539618.3591705","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3539618.3591705","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 46th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.47999998927116394,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":53,"referenced_works":["https://openalex.org/W8870360","https://openalex.org/W1596649971","https://openalex.org/W1673310716","https://openalex.org/W1963889129","https://openalex.org/W1975692209","https://openalex.org/W1981276685","https://openalex.org/W1984685202","https://openalex.org/W2013535308","https://openalex.org/W2019863495","https://openalex.org/W2063555110","https://openalex.org/W2088884958","https://openalex.org/W2106277773","https://openalex.org/W2112037975","https://openalex.org/W2185175083","https://openalex.org/W2194775991","https://openalex.org/W2398606097","https://openalex.org/W2606965845","https://openalex.org/W2742000522","https://openalex.org/W2765440071","https://openalex.org/W2892181857","https://openalex.org/W2903664715","https://openalex.org/W2946298263","https://openalex.org/W2954793896","https://openalex.org/W2956018683","https://openalex.org/W2963340196","https://openalex.org/W2963389687","https://openalex.org/W2967957126","https://openalex.org/W2981951787","https://openalex.org/W2994818707","https://openalex.org/W2997297138","https://openalex.org/W3016451726","https://openalex.org/W3017267450","https://openalex.org/W3017313555","https://openalex.org/W3034140121","https://openalex.org/W3035256320","https://openalex.org/W3035454331","https://openalex.org/W3035730922","https://openalex.org/W3093002089","https://openalex.org/W3093206850","https://openalex.org/W3093493377","https://openalex.org/W3155865710","https://openalex.org/W3176471072","https://openalex.org/W3176913643","https://openalex.org/W3179442710","https://openalex.org/W3203247393","https://openalex.org/W3205818350","https://openalex.org/W3206019042","https://openalex.org/W3212100893","https://openalex.org/W4212848270","https://openalex.org/W4225774139","https://openalex.org/W4293248850","https://openalex.org/W4304084306","https://openalex.org/W4312980231"],"related_works":["https://openalex.org/W2034539438","https://openalex.org/W1606474234","https://openalex.org/W2124645781","https://openalex.org/W2184057774","https://openalex.org/W2162645796","https://openalex.org/W2543381692","https://openalex.org/W1975659822","https://openalex.org/W3087943932","https://openalex.org/W2391460410","https://openalex.org/W1658719554"],"abstract_inverted_index":{"In":[0],"addition":[1],"to":[2,21,43,49,61,76,90,105,157,198,213,219],"relevance,":[3],"diversity":[4,92,131],"is":[5,19,58,196,211],"an":[6,182],"important":[7],"yet":[8],"less":[9],"studied":[10],"performance":[11],"metric":[12],"of":[13,47,56,117,132,181],"cross-modal":[14,185],"image":[15,28,174],"retrieval":[16,29,35,39,71,223],"systems,":[17],"which":[18,86,126],"critical":[20],"user":[22],"experience.":[23],"Existing":[24],"solutions":[25],"for":[26,165],"diversity-aware":[27,82],"either":[30],"explicitly":[31],"post-process":[32],"the":[33,67,96,128,133,178,201,221,243],"raw":[34],"results":[36,134],"from":[37,216],"standard":[38,70],"systems":[40,72],"or":[41,119],"try":[42],"learn":[44,106],"multi-vector":[45,99],"representations":[46,164,180],"images":[48,114,116,215],"represent":[50],"their":[51,204],"diverse":[52],"semantics.":[53],"However,":[54],"neither":[55],"them":[57],"good":[59],"enough":[60],"balance":[62],"relevance":[63,129],"and":[64,79,115,130,162,232,241],"diversity.":[65],"On":[66,95],"one":[68],"hand,":[69,98],"are":[73,102],"usually":[74],"biased":[75],"common":[77],"semantics":[78,121],"seldom":[80],"exploit":[81],"regularization":[83],"in":[84],"training,":[85],"makes":[87],"it":[88],"difficult":[89],"promote":[91],"by":[93,136,176],"post-processing.":[94],"other":[97],"representation":[100],"methods":[101,245],"not":[103],"guaranteed":[104],"robust":[107,163],"multiple":[108],"projections.":[109],"As":[110],"a":[111,150,192,208,247,250],"result,":[112],"irrelevant":[113],"rare":[118],"unique":[120],"may":[122],"be":[123],"projected":[124],"inappropriately,":[125],"degrades":[127],"generated":[135],"some":[137],"typical":[138],"algorithms":[139],"like":[140],"top-k.":[141],"To":[142],"cope":[143],"with":[144,187],"these":[145],"problems,":[146],"this":[147],"paper":[148],"presents":[149],"new":[151],"method":[152],"called":[153],"CoLT":[154,170,236],"that":[155,235],"tries":[156],"generate":[158],"much":[159],"more":[160],"representative":[161],"accurately":[166],"classifying":[167],"images.":[168],"Specifically,":[169],"first":[171],"extracts":[172],"semantics-aware":[173,188],"features":[175,202],"enhancing":[177],"preliminary":[179],"existing":[183,244],"one-to-one":[184],"system":[186],"contrastive":[189],"learning.":[190],"Then,":[191],"transformer-based":[193],"token":[194],"classifier":[195],"developed":[197],"subsume":[199],"all":[200],"into":[203],"corresponding":[205],"categories.":[206],"Finally,":[207],"post-processing":[209],"algorithm":[210],"designed":[212],"retrieve":[214],"each":[217],"category":[218],"form":[220],"final":[222],"result.":[224],"Extensive":[225],"experiments":[226],"on":[227],"two":[228],"real-world":[229],"datasets":[230],"Div400":[231],"Div150Cred":[233],"show":[234],"can":[237],"effectively":[238],"boost":[239],"diversity,":[240],"outperforms":[242],"as":[246],"whole":[248],"(with":[249],"higher":[251],"F1":[252],"score).":[253]},"counts_by_year":[{"year":2024,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
