{"id":"https://openalex.org/W2963367015","doi":"https://doi.org/10.1109/vcip.2017.8305144","title":"Clothing retrieval with visual attention model","display_name":"Clothing retrieval with visual attention model","publication_year":2017,"publication_date":"2017-12-01","ids":{"openalex":"https://openalex.org/W2963367015","doi":"https://doi.org/10.1109/vcip.2017.8305144","mag":"2963367015"},"language":"en","primary_location":{"id":"doi:10.1109/vcip.2017.8305144","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip.2017.8305144","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101635342","display_name":"Zhonghao Wang","orcid":"https://orcid.org/0000-0002-4650-6395"},"institutions":[{"id":"https://openalex.org/I4210099312","display_name":"Shandong Jiaotong University","ror":"https://ror.org/01848hk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210099312"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhonghao Wang","raw_affiliation_strings":["Cooperative Medianet Innovation Center, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Cooperative Medianet Innovation Center, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I4210099312","https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074390218","display_name":"Yujun Gu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210099312","display_name":"Shandong Jiaotong University","ror":"https://ror.org/01848hk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210099312"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yujun Gu","raw_affiliation_strings":["Cooperative Medianet Innovation Center, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Cooperative Medianet Innovation Center, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I4210099312","https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100342828","display_name":"Ya Zhang","orcid":"https://orcid.org/0000-0002-5390-9053"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]},{"id":"https://openalex.org/I4210099312","display_name":"Shandong Jiaotong University","ror":"https://ror.org/01848hk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210099312"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ya Zhang","raw_affiliation_strings":["Cooperative Medianet Innovation Center, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Cooperative Medianet Innovation Center, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I4210099312","https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045140292","display_name":"Jun Zhou","orcid":"https://orcid.org/0000-0001-6033-6102"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Zhou","raw_affiliation_strings":["Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028704757","display_name":"Xiao Gu","orcid":"https://orcid.org/0000-0002-3015-5818"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao Gu","raw_affiliation_strings":["Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101635342"],"corresponding_institution_ids":["https://openalex.org/I183067930","https://openalex.org/I4210099312"],"apc_list":null,"apc_paid":null,"fwci":2.0935,"has_fulltext":false,"cited_by_count":58,"citation_normalized_percentile":{"value":0.92849817,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9799000024795532,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9767000079154968,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7926558256149292},{"id":"https://openalex.org/keywords/clothing","display_name":"Clothing","score":0.701896071434021},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.696281909942627},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6649545431137085},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6348490715026855},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.5899401307106018},{"id":"https://openalex.org/keywords/landmark","display_name":"Landmark","score":0.5718326568603516},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5630670785903931},{"id":"https://openalex.org/keywords/dropout","display_name":"Dropout (neural networks)","score":0.5544405579566956},{"id":"https://openalex.org/keywords/connection","display_name":"Connection (principal bundle)","score":0.48808753490448},{"id":"https://openalex.org/keywords/visual-word","display_name":"Visual Word","score":0.46326592564582825},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4457401633262634},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41599223017692566},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3806847631931305},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.33680933713912964},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33046191930770874},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2378811538219452},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07576367259025574}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7926558256149292},{"id":"https://openalex.org/C530175646","wikidata":"https://www.wikidata.org/wiki/Q11460","display_name":"Clothing","level":2,"score":0.701896071434021},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.696281909942627},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6649545431137085},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6348490715026855},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.5899401307106018},{"id":"https://openalex.org/C2780297707","wikidata":"https://www.wikidata.org/wiki/Q4895393","display_name":"Landmark","level":2,"score":0.5718326568603516},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5630670785903931},{"id":"https://openalex.org/C2776145597","wikidata":"https://www.wikidata.org/wiki/Q25339462","display_name":"Dropout (neural networks)","level":2,"score":0.5544405579566956},{"id":"https://openalex.org/C13355873","wikidata":"https://www.wikidata.org/wiki/Q2920850","display_name":"Connection (principal bundle)","level":2,"score":0.48808753490448},{"id":"https://openalex.org/C189391414","wikidata":"https://www.wikidata.org/wiki/Q7936579","display_name":"Visual Word","level":4,"score":0.46326592564582825},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4457401633262634},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41599223017692566},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3806847631931305},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.33680933713912964},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33046191930770874},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2378811538219452},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07576367259025574},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/vcip.2017.8305144","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip.2017.8305144","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W1903029394","https://openalex.org/W1904365287","https://openalex.org/W2096733369","https://openalex.org/W2097117768","https://openalex.org/W2121339428","https://openalex.org/W2194775991","https://openalex.org/W2200092826","https://openalex.org/W2395611524","https://openalex.org/W2471768434","https://openalex.org/W2576990223","https://openalex.org/W3099206234","https://openalex.org/W6637373629","https://openalex.org/W6640036494","https://openalex.org/W6687483927"],"related_works":["https://openalex.org/W2063218608","https://openalex.org/W4386105885","https://openalex.org/W2184288218","https://openalex.org/W2947282851","https://openalex.org/W2374066281","https://openalex.org/W4387423606","https://openalex.org/W2071180033","https://openalex.org/W2036058638","https://openalex.org/W2528082075","https://openalex.org/W155590726"],"abstract_inverted_index":{"Clothing":[0],"retrieval":[1,21,130],"is":[2,60,91],"a":[3,28,34,76,95],"challenging":[4],"problem":[5],"in":[6,39],"computer":[7],"vision.":[8],"With":[9],"the":[10,17,40,56,111,115,119,135,138,147,151,155],"advance":[11],"of":[12,19,36,42,137,163],"Convolutional":[13],"Neural":[14],"Networks":[15],"(CNNs),":[16],"accuracy":[18],"clothing":[20,45,87,129],"has":[22],"been":[23],"significantly":[24],"improved.":[25],"FashionNet":[26],"[1],":[27],"recent":[29],"study,":[30],"proposes":[31],"to":[32,50,69,82,94,98,146],"employ":[33],"set":[35],"artificial":[37],"features":[38],"form":[41,99],"landmarks":[43],"for":[44,53],"retrieval,":[46],"which":[47,65,107],"are":[48,166],"shown":[49],"be":[51],"helpful":[52],"retrieval.":[54],"However,":[55],"landmark":[57],"detection":[58],"module":[59],"trained":[61],"with":[62,114],"strong":[63],"supervision":[64],"requires":[66],"considerable":[67],"efforts":[68],"obtain.":[70],"In":[71],"this":[72],"paper,":[73],"we":[74],"propose":[75],"self-learning":[77],"Visual":[78],"Attention":[79],"Model":[80],"(VAM)":[81],"extracts":[83],"attention":[84,120],"maps":[85,113],"from":[86],"images.":[88],"The":[89],"VAM":[90],"further":[92],"connected":[93],"global":[96],"network":[97,102,156],"an":[100],"end-to-end":[101],"structure":[103,157],"through":[104],"Impdrop":[105,152],"connection":[106,153],"randomly":[108],"Dropout":[109],"on":[110,124],"feature":[112],"probabilities":[116],"given":[117],"by":[118],"map.":[121],"Extensive":[122],"experiments":[123],"several":[125],"widely":[126],"used":[127],"benchmark":[128],"data":[131],"sets":[132,162],"have":[133],"demonstrated":[134],"promise":[136],"proposed":[139],"method.":[140],"We":[141],"also":[142],"show":[143],"that":[144],"compared":[145],"trivial":[148],"Product":[149],"connection,":[150],"makes":[154],"more":[158],"robust":[159],"when":[160],"training":[161],"limited":[164],"size":[165],"used.":[167]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":12},{"year":2021,"cited_by_count":11},{"year":2020,"cited_by_count":12},{"year":2019,"cited_by_count":10},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
