{"id":"https://openalex.org/W2061571889","doi":"https://doi.org/10.1109/cvpr.2010.5540046","title":"ARISTA - image search to annotation on billions of web photos","display_name":"ARISTA - image search to annotation on billions of web photos","publication_year":2010,"publication_date":"2010-06-01","ids":{"openalex":"https://openalex.org/W2061571889","doi":"https://doi.org/10.1109/cvpr.2010.5540046","mag":"2061571889"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr.2010.5540046","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2010.5540046","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE Computer Society Conference on Computer Vision and Pattern Recognition","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101839607","display_name":"Xinjing Wang","orcid":"https://orcid.org/0000-0002-4110-7811"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xin-Jing Wang","raw_affiliation_strings":["Microsoft Research Asia, Beijing, China","Microsoft Research Asia, 49 Zhichun Road, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]},{"raw_affiliation_string":"Microsoft Research Asia, 49 Zhichun Road, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100433899","display_name":"Lei Zhang","orcid":"https://orcid.org/0000-0002-2078-4215"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Zhang","raw_affiliation_strings":["Microsoft Research Asia, Beijing, China","Microsoft Research Asia, 49 Zhichun Road, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]},{"raw_affiliation_string":"Microsoft Research Asia, 49 Zhichun Road, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100347731","display_name":"Ming Liu","orcid":"https://orcid.org/0000-0001-5138-9640"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ming Liu","raw_affiliation_strings":["One Microsoft Way, Microsoft Corporation, Redmond, USA","Microsoft Corporation, One Microsoft Way, Redmond, U.S.A"],"affiliations":[{"raw_affiliation_string":"One Microsoft Way, Microsoft Corporation, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation, One Microsoft Way, Redmond, U.S.A","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100421473","display_name":"Yi Li","orcid":"https://orcid.org/0000-0002-2856-7290"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yi Li","raw_affiliation_strings":["One Microsoft Way, Microsoft Corporation, Redmond, USA","Microsoft Corporation, One Microsoft Way, Redmond, U.S.A"],"affiliations":[{"raw_affiliation_string":"One Microsoft Way, Microsoft Corporation, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation, One Microsoft Way, Redmond, U.S.A","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103733614","display_name":"Wei\u2010Ying Ma","orcid":"https://orcid.org/0000-0002-7384-0735"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei-Ying Ma","raw_affiliation_strings":["Microsoft Research Asia, Beijing, China","Microsoft Research Asia, 49 Zhichun Road, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]},{"raw_affiliation_string":"Microsoft Research Asia, 49 Zhichun Road, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101839607"],"corresponding_institution_ids":["https://openalex.org/I4210113369"],"apc_list":null,"apc_paid":null,"fwci":16.8102,"has_fulltext":false,"cited_by_count":90,"citation_normalized_percentile":{"value":0.99408865,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"2987","last_page":"2994"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10689","display_name":"Remote-Sensing Image Classification","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8362733721733093},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.654463529586792},{"id":"https://openalex.org/keywords/automatic-image-annotation","display_name":"Automatic image annotation","score":0.6160100102424622},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5957624316215515},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.5313115119934082},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.5263316035270691},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.5209356546401978},{"id":"https://openalex.org/keywords/crawling","display_name":"Crawling","score":0.5125577449798584},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.463569700717926},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4597902297973633},{"id":"https://openalex.org/keywords/web-crawler","display_name":"Web crawler","score":0.4430847764015198},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.43036991357803345},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3816072642803192},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3347429633140564},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.27960968017578125}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8362733721733093},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.654463529586792},{"id":"https://openalex.org/C199579030","wikidata":"https://www.wikidata.org/wiki/Q2851778","display_name":"Automatic image annotation","level":4,"score":0.6160100102424622},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5957624316215515},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.5313115119934082},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.5263316035270691},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.5209356546401978},{"id":"https://openalex.org/C100368936","wikidata":"https://www.wikidata.org/wiki/Q1411725","display_name":"Crawling","level":2,"score":0.5125577449798584},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.463569700717926},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4597902297973633},{"id":"https://openalex.org/C13743948","wikidata":"https://www.wikidata.org/wiki/Q45842","display_name":"Web crawler","level":2,"score":0.4430847764015198},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.43036991357803345},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3816072642803192},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3347429633140564},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.27960968017578125},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C105702510","wikidata":"https://www.wikidata.org/wiki/Q514","display_name":"Anatomy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/cvpr.2010.5540046","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2010.5540046","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE Computer Society Conference on Computer Vision and Pattern Recognition","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.181.241","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.181.241","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://research.microsoft.com/en-us/people/xjwang/cvpr10_paper301_arista_final.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1604437383","https://openalex.org/W2038721957","https://openalex.org/W2106485656","https://openalex.org/W2108598243","https://openalex.org/W2110441437","https://openalex.org/W2111976047","https://openalex.org/W2111993661","https://openalex.org/W2117074709","https://openalex.org/W2145072179","https://openalex.org/W2145607950","https://openalex.org/W2150692003","https://openalex.org/W2157465536","https://openalex.org/W2166670710","https://openalex.org/W2171011251","https://openalex.org/W2181691731","https://openalex.org/W3070706509","https://openalex.org/W4235505822","https://openalex.org/W4285719527","https://openalex.org/W6676297131","https://openalex.org/W6681554747","https://openalex.org/W6683169846","https://openalex.org/W7011438494"],"related_works":["https://openalex.org/W2077853975","https://openalex.org/W1501494461","https://openalex.org/W2349057464","https://openalex.org/W2060956679","https://openalex.org/W2072164819","https://openalex.org/W1769740626","https://openalex.org/W1965890413","https://openalex.org/W172077973","https://openalex.org/W2099170935","https://openalex.org/W2052675425"],"abstract_inverted_index":{"Though":[0],"it":[1],"has":[2],"cost":[3],"great":[4,43],"research":[5],"efforts":[6],"for":[7,171,199],"decades,":[8],"object":[9,34],"recognition":[10],"is":[11,137,164],"still":[12,26],"a":[13,60,80,97],"challenging":[14],"problem.":[15],"Traditional":[16],"methods":[17],"based":[18,155,206],"on":[19,156,207,229],"machine":[20],"learning":[21],"or":[22],"computer":[23],"vision":[24],"are":[25,114],"in":[27,59,106,117,177,202,210],"the":[28,47,66,90,107,127,135,142,146,162,178,194,211,216,221,224],"stage":[29,144],"of":[30,33,49,55,84,145,166,218,223,227],"tackling":[31],"hundreds":[32],"categories.":[35],"In":[36,110],"recent":[37],"years,":[38],"non-parametric":[39],"approaches":[40],"have":[41,187],"demonstrated":[42],"success,":[44],"which":[45,93],"understand":[46],"content":[48],"an":[50],"image":[51,72,85,99,121],"by":[52,126],"propagating":[53],"labels":[54],"its":[56],"similar":[57],"images":[58,151,174,186,201],"large-scale":[61],"dataset.":[62],"However,":[63],"due":[64],"to":[65,95,197],"limited":[67],"dataset":[68],"size":[69],"and":[70,132,154,193],"imperfect":[71],"crawling":[73],"strategy,":[74],"previous":[75],"work":[76],"can":[77,123],"only":[78],"address":[79],"biased":[81],"small":[82],"subset":[83],"concepts.":[86],"Here":[87],"we":[88,113,214],"introduce":[89],"Arista":[91],"project,":[92,112],"aims":[94],"build":[96],"practical":[98],"annotation":[100,129],"engine":[101],"targeting":[102],"at":[103,220],"popular":[104,172],"concepts":[105,122],"real":[108],"world.":[109],"this":[111],"particularly":[115],"interested":[116],"understanding":[118],"how":[119,133],"many":[120],"be":[124],"addressed":[125],"data-driven":[128],"approach":[130],"(coverage)":[131],"good":[134],"performance":[136],"(precision).":[138],"This":[139],"paper":[140],"reports":[141],"first":[143],"work.":[147],"Two":[148],"billions":[149],"web":[150,173,185],"were":[152],"indexed,":[153],"simple":[157],"yet":[158],"effective":[159],"near-duplicate":[160],"detection,":[161],"system":[163],"capable":[165],"automatically":[167],"generating":[168],"accurate":[169],"tags":[170],"having":[175],"near-duplicates":[176],"database.":[179],"We":[180],"found":[181],"that":[182],"about":[183],"8.1%":[184],"more":[188],"than":[189],"ten":[190],"near":[191],"duplicate":[192],"number":[195],"increases":[196],"28.5%":[198],"top":[200],"search":[203],"results.":[204],"Further,":[205],"random":[208],"samples":[209],"latter":[212],"case,":[213],"observed":[215],"precision":[217],"57.9%":[219],"point":[222],"highest":[225],"recall":[226],"28%":[228],"ground":[230],"truth":[231],"tags.":[232]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":6},{"year":2016,"cited_by_count":8},{"year":2015,"cited_by_count":7},{"year":2014,"cited_by_count":8},{"year":2013,"cited_by_count":18},{"year":2012,"cited_by_count":18}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
