{"id":"https://openalex.org/W2295830240","doi":"https://doi.org/10.1109/icip.2015.7351684","title":"Hierarchical multi-VLAD for image retrieval","display_name":"Hierarchical multi-VLAD for image retrieval","publication_year":2015,"publication_date":"2015-09-01","ids":{"openalex":"https://openalex.org/W2295830240","doi":"https://doi.org/10.1109/icip.2015.7351684","mag":"2295830240"},"language":"en","primary_location":{"id":"doi:10.1109/icip.2015.7351684","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icip.2015.7351684","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100650009","display_name":"Yitong Wang","orcid":"https://orcid.org/0000-0002-7559-4152"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yitong Wang","raw_affiliation_strings":["Cooperative Medianet Innovation Center, Shanghai, China","Institute of Digital Media, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Cooperative Medianet Innovation Center, Shanghai, China","institution_ids":[]},{"raw_affiliation_string":"Institute of Digital Media, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024879728","display_name":"Ling\u2010Yu Duan","orcid":"https://orcid.org/0000-0002-4491-2023"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ling-Yu Duan","raw_affiliation_strings":["Institute of Digital Media, School of EE&CS, Peking University, Beijing, Beijing, CN"],"affiliations":[{"raw_affiliation_string":"Institute of Digital Media, School of EE&CS, Peking University, Beijing, Beijing, CN","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030005076","display_name":"Jie Lin","orcid":"https://orcid.org/0000-0002-8971-0660"},"institutions":[{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Jie Lin","raw_affiliation_strings":["Institute for Infocomm Research, Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research, Singapore","institution_ids":["https://openalex.org/I3005327000"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100407602","display_name":"Zhe Wang","orcid":"https://orcid.org/0000-0002-1385-9012"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhe Wang","raw_affiliation_strings":["Cooperative Medianet Innovation Center, Shanghai, China","Institute of Digital Media, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Cooperative Medianet Innovation Center, Shanghai, China","institution_ids":[]},{"raw_affiliation_string":"Institute of Digital Media, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058066577","display_name":"Tiejun Huang","orcid":"https://orcid.org/0000-0002-4234-6099"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tiejun Huang","raw_affiliation_strings":["Cooperative Medianet Innovation Center, Shanghai, China","Institute of Digital Media, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Cooperative Medianet Innovation Center, Shanghai, China","institution_ids":[]},{"raw_affiliation_string":"Institute of Digital Media, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100650009"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.7994,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.8044409,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"4629","last_page":"4633"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9846000075340271,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/centroid","display_name":"Centroid","score":0.6596242189407349},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6399644017219543},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6324743628501892},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6037552356719971},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.6018149852752686},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.6005503535270691},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.5718233585357666},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.5529732704162598},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.501708984375},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.49788522720336914},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.4964945912361145},{"id":"https://openalex.org/keywords/scale-invariant-feature-transform","display_name":"Scale-invariant feature transform","score":0.4550642967224121},{"id":"https://openalex.org/keywords/vector-quantization","display_name":"Vector quantization","score":0.42609652876853943},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.42353835701942444},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3289532959461212},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.2602730393409729},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.21472841501235962},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.19525986909866333}],"concepts":[{"id":"https://openalex.org/C146599234","wikidata":"https://www.wikidata.org/wiki/Q511093","display_name":"Centroid","level":2,"score":0.6596242189407349},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6399644017219543},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6324743628501892},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6037552356719971},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.6018149852752686},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.6005503535270691},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.5718233585357666},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.5529732704162598},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.501708984375},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.49788522720336914},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.4964945912361145},{"id":"https://openalex.org/C61265191","wikidata":"https://www.wikidata.org/wiki/Q767770","display_name":"Scale-invariant feature transform","level":3,"score":0.4550642967224121},{"id":"https://openalex.org/C199833920","wikidata":"https://www.wikidata.org/wiki/Q612536","display_name":"Vector quantization","level":2,"score":0.42609652876853943},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.42353835701942444},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3289532959461212},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2602730393409729},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.21472841501235962},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.19525986909866333},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icip.2015.7351684","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icip.2015.7351684","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2015 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.7300000190734863,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1556531089","https://openalex.org/W1608697715","https://openalex.org/W1677409904","https://openalex.org/W1979931042","https://openalex.org/W1984309565","https://openalex.org/W1995922888","https://openalex.org/W2006002369","https://openalex.org/W2012592962","https://openalex.org/W2044284589","https://openalex.org/W2045143396","https://openalex.org/W2068143350","https://openalex.org/W2071027807","https://openalex.org/W2103924867","https://openalex.org/W2105516263","https://openalex.org/W2128017662","https://openalex.org/W2131846894","https://openalex.org/W2144119741","https://openalex.org/W2148809531","https://openalex.org/W2151103935","https://openalex.org/W6633472159","https://openalex.org/W6636371519","https://openalex.org/W6649312870"],"related_works":["https://openalex.org/W3034955165","https://openalex.org/W2094920358","https://openalex.org/W2041448692","https://openalex.org/W2247121321","https://openalex.org/W2391926582","https://openalex.org/W2087391438","https://openalex.org/W1966831329","https://openalex.org/W2316074893","https://openalex.org/W2020188645","https://openalex.org/W2145450927"],"abstract_inverted_index":{"Constructing":[0],"discriminative":[1],"feature":[2],"descriptors":[3],"is":[4,18,39],"crucial":[5],"towards":[6],"effective":[7],"image":[8],"retrieval.":[9],"The":[10],"state-of-the-art":[11,188],"powerful":[12],"global":[13],"descriptor":[14,115,157],"for":[15,61,158,169],"this":[16,103],"purpose":[17],"Vector":[19],"of":[20,28,58,83,89,161,191],"Locally":[21],"Aggregated":[22],"Descriptors":[23],"(VLAD).":[24],"Given":[25],"a":[26,46,107,123,134,155],"set":[27],"local":[29,43],"features":[30,44,60],"(say,":[31],"SIFT)":[32],"extracted":[33],"from":[34,70,142],"an":[35],"image,":[36],"the":[37,55,66,76,81,112,130,162,170,184],"VLAD":[38,131,156],"generated":[40],"by":[41,79],"quantizing":[42],"with":[45,99,133,148],"small":[47],"visual":[48],"vocabulary":[49,84,163],"(64":[50],"to":[51,87,95,110,128,144,167],"512":[52],"centroids),":[53],"aggregating":[54],"residual":[56,68],"statistics":[57],"quantized":[59],"each":[62,71,159],"centroid":[63],"and":[64,117],"concatenating":[65],"aggregated":[67],"vectors":[69],"centroid.":[72],"One":[73],"can":[74],"increase":[75],"search":[77],"accuracy":[78],"increasing":[80],"size":[82],"(from":[85],"hundreds":[86,88],"thousands),":[90],"which,":[91],"however,":[92],"it":[93],"leads":[94],"heavy":[96],"computation":[97,118,132],"cost":[98],"flat":[100],"quantization.":[101],"In":[102],"paper,":[104],"we":[105,150],"propose":[106],"hierarchical":[108,125],"multi-VLAD":[109],"seek":[111],"tradeoff":[113],"between":[114],"discriminability":[116],"complexity.":[119],"We":[120],"build":[121],"up":[122],"tree-structured":[124],"quantization":[126,138,171],"(TSHQ)":[127],"accelerate":[129],"large":[135],"vocabulary.":[136],"As":[137],"error":[139,172],"may":[140],"propagate":[141],"root":[143],"leaf":[145],"node":[146],"(centroid)":[147],"TSHQ,":[149],"introduce":[151],"multi-VLAD,":[152],"which":[153],"constructing":[154],"level":[160],"tree,":[164],"so":[165],"as":[166,196,198],"compensate":[168],"at":[173],"that":[174,183],"level.":[175],"Extensive":[176],"evaluation":[177],"over":[178],"benchmark":[179],"datasets":[180],"has":[181],"shown":[182],"proposed":[185],"approach":[186],"outperforms":[187],"in":[189],"terms":[190],"retrieval":[192],"accuracy,":[193],"fast":[194],"extraction,":[195],"well":[197],"light":[199],"memory":[200],"cost.":[201]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2016,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
