{"id":"https://openalex.org/W2981471572","doi":"https://doi.org/10.1145/3343031.3351081","title":"Towards Optimal CNN Descriptors for Large-Scale Image Retrieval","display_name":"Towards Optimal CNN Descriptors for Large-Scale Image Retrieval","publication_year":2019,"publication_date":"2019-10-15","ids":{"openalex":"https://openalex.org/W2981471572","doi":"https://doi.org/10.1145/3343031.3351081","mag":"2981471572"},"language":"en","primary_location":{"id":"doi:10.1145/3343031.3351081","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3343031.3351081","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110860223","display_name":"Yinzheng Gu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210099297","display_name":"Jilian Technology Group (China)","ror":"https://ror.org/016q5ce10","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210099297"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yinzheng Gu","raw_affiliation_strings":["Jilian Technology Group (Video++) &amp; Fudan-Jilian Joint Research Center of Intelligent Video Technology Shanghai, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Jilian Technology Group (Video++) &amp; Fudan-Jilian Joint Research Center of Intelligent Video Technology Shanghai, Shanghai, China","institution_ids":["https://openalex.org/I4210099297"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039336788","display_name":"Chuanpeng Li","orcid":"https://orcid.org/0000-0003-1804-9032"},"institutions":[{"id":"https://openalex.org/I4210099297","display_name":"Jilian Technology Group (China)","ror":"https://ror.org/016q5ce10","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210099297"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chuanpeng Li","raw_affiliation_strings":["Jilian Technology Group (Video++) &amp; Fudan-Jilian Joint Research Center of Intelligent Video Technology Shanghai, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Jilian Technology Group (Video++) &amp; Fudan-Jilian Joint Research Center of Intelligent Video Technology Shanghai, Shanghai, China","institution_ids":["https://openalex.org/I4210099297"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047962986","display_name":"Yu\u2013Gang Jiang","orcid":"https://orcid.org/0000-0002-1907-8567"},"institutions":[{"id":"https://openalex.org/I4210099297","display_name":"Jilian Technology Group (China)","ror":"https://ror.org/016q5ce10","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210099297"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu-Gang Jiang","raw_affiliation_strings":["Jilian Technology Group (Video++) &amp; Fudan-Jilian Joint Research Center of Intelligent Video Technology Shanghai, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Jilian Technology Group (Video++) &amp; Fudan-Jilian Joint Research Center of Intelligent Video Technology Shanghai, Shanghai, China","institution_ids":["https://openalex.org/I4210099297"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110860223"],"corresponding_institution_ids":["https://openalex.org/I4210099297"],"apc_list":null,"apc_paid":null,"fwci":0.4049,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.6591646,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":93,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1768","last_page":"1776"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8445490598678589},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.7687267661094666},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6609282493591309},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.61009281873703},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.5687004923820496},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5565876364707947},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5216001272201538},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4459373950958252},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.43433406949043274},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4176390767097473},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.417126327753067},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.41501137614250183}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8445490598678589},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.7687267661094666},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6609282493591309},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.61009281873703},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.5687004923820496},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5565876364707947},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5216001272201538},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4459373950958252},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.43433406949043274},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4176390767097473},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.417126327753067},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.41501137614250183},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3343031.3351081","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3343031.3351081","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W204268067","https://openalex.org/W1524680991","https://openalex.org/W1533861849","https://openalex.org/W1679894842","https://openalex.org/W1833123814","https://openalex.org/W1972378554","https://openalex.org/W1976591483","https://openalex.org/W1979931042","https://openalex.org/W1984309565","https://openalex.org/W2003340926","https://openalex.org/W2062118960","https://openalex.org/W2071027807","https://openalex.org/W2100398441","https://openalex.org/W2117539524","https://openalex.org/W2131846894","https://openalex.org/W2141362318","https://openalex.org/W2148809531","https://openalex.org/W2151103935","https://openalex.org/W2163605009","https://openalex.org/W2174726731","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2295537791","https://openalex.org/W2340690086","https://openalex.org/W2531409750","https://openalex.org/W2544587078","https://openalex.org/W2549139847","https://openalex.org/W2559091987","https://openalex.org/W2604652497","https://openalex.org/W2883134734","https://openalex.org/W2898885550","https://openalex.org/W2899771611","https://openalex.org/W2963125676","https://openalex.org/W2963446712","https://openalex.org/W2964121744","https://openalex.org/W2964157791","https://openalex.org/W2964350391"],"related_works":["https://openalex.org/W2383111961","https://openalex.org/W2365952365","https://openalex.org/W2352448290","https://openalex.org/W2380820513","https://openalex.org/W2913146933","https://openalex.org/W2372385138","https://openalex.org/W4296359239","https://openalex.org/W2101155126","https://openalex.org/W2043093291","https://openalex.org/W2363545964"],"abstract_inverted_index":{"Instance-level":[0],"image":[1],"retrieval":[2,69,127,158],"is":[3,38,58],"a":[4,19,23,63,73,94,100,111,116,148,189],"long-standing":[5],"and":[6,22,44,79,103,129,142,153,163,173,184],"challenging":[7,143],"problem":[8],"in":[9,108],"multimedia.":[10],"Recently,":[11],"fine-tuning":[12,125],"Convolutional":[13],"Neural":[14],"Networks":[15],"(CNNs)":[16],"has":[17],"become":[18],"promising":[20],"direction,":[21],"number":[24],"of":[25,55,66,97],"successful":[26],"strategies":[27],"based":[28],"on":[29,99,156],"global":[30],"CNN":[31],"descriptors":[32],"have":[33],"been":[34],"proposed.":[35],"However,":[36],"it":[37],"difficult":[39],"to":[40,48,193],"make":[41],"direct":[42],"comparisons":[43],"draw":[45],"conclusions":[46],"due":[47],"different":[49,90],"settings":[50],"and/or":[51],"datasets.":[52],"The":[53],"goal":[54],"this":[56],"paper":[57],"two-fold.":[59],"Firstly,":[60],"we":[61,114,146,175],"present":[62],"unified":[64],"implementation":[65],"modern":[67],"global-CNN-based":[68],"systems,":[70],"break":[71],"such":[72,110,160],"system":[74],"into":[75],"six":[76],"major":[77],"components,":[78],"investigate":[80],"each":[81],"part":[82],"individually":[83],"as":[84,86,161,165,167],"well":[85,166],"globally":[87],"when":[88],"considering":[89],"configurations.":[91],"We":[92],"conduct":[93],"systematic":[95],"series":[96],"experiments":[98],"component-by-component":[101],"basis":[102],"find":[104],"an":[105],"optimal":[106],"solution":[107],"designing":[109],"system.":[112],"Secondly,":[113],"introduce":[115],"novel":[117],"joint":[118],"loss":[119],"function":[120],"with":[121,131],"learnable":[122],"parameter":[123],"for":[124,126,150],"tasks":[128],"show,":[130],"extensive":[132],"experiments,":[133],"significant":[134],"improvement":[135],"over":[136],"previous":[137],"works.":[138],"On":[139],"the":[140],"new":[141],"large-scale":[144],"Google-Landmarks-Dataset,":[145],"set":[147],"baseline":[149],"future":[151],"research":[152],"comparisons,":[154],"while":[155],"traditional":[157],"benchmarks":[159],"Oxford5k":[162],"Paris6k,":[164],"their":[168],"recent":[169],"revised":[170],"versions":[171],"ROxford5k":[172],"RParis6k,":[174],"achieve":[176],"state-of-the-art":[177],"performance":[178],"under":[179],"all":[180],"three":[181],"(Easy,":[182],"Medium,":[183],"Hard)":[185],"evaluation":[186],"protocals":[187],"by":[188],"large":[190],"margin":[191],"compared":[192],"competing":[194],"methods.":[195]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
