{"id":"https://openalex.org/W1997454659","doi":"https://doi.org/10.1109/cvpr.2010.5540135","title":"Harvesting large-scale weakly-tagged image databases from the web","display_name":"Harvesting large-scale weakly-tagged image databases from the web","publication_year":2010,"publication_date":"2010-06-01","ids":{"openalex":"https://openalex.org/W1997454659","doi":"https://doi.org/10.1109/cvpr.2010.5540135","mag":"1997454659"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr.2010.5540135","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2010.5540135","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE Computer Society Conference on Computer Vision and Pattern Recognition","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100728564","display_name":"Jianping Fan","orcid":"https://orcid.org/0000-0002-4923-0910"},"institutions":[{"id":"https://openalex.org/I102149020","display_name":"University of North Carolina at Charlotte","ror":"https://ror.org/04dawnj30","country_code":"US","type":"education","lineage":["https://openalex.org/I102149020"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jianping Fan","raw_affiliation_strings":["Department of Computer Science, UNC-Charlotte, NC, USA","Department of Computer Science, UNC-Charlotte, NC28223, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, UNC-Charlotte, NC, USA","institution_ids":["https://openalex.org/I102149020"]},{"raw_affiliation_string":"Department of Computer Science, UNC-Charlotte, NC28223, USA#TAB#","institution_ids":["https://openalex.org/I102149020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045434740","display_name":"Yi Shen","orcid":"https://orcid.org/0000-0002-1679-9238"},"institutions":[{"id":"https://openalex.org/I102149020","display_name":"University of North Carolina at Charlotte","ror":"https://ror.org/04dawnj30","country_code":"US","type":"education","lineage":["https://openalex.org/I102149020"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yi Shen","raw_affiliation_strings":["Department of Computer Science, UNC-Charlotte, NC, USA","Department of Computer Science, UNC-Charlotte, NC28223, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, UNC-Charlotte, NC, USA","institution_ids":["https://openalex.org/I102149020"]},{"raw_affiliation_string":"Department of Computer Science, UNC-Charlotte, NC28223, USA#TAB#","institution_ids":["https://openalex.org/I102149020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049381658","display_name":"Ning Zhou","orcid":"https://orcid.org/0000-0001-5645-7307"},"institutions":[{"id":"https://openalex.org/I102149020","display_name":"University of North Carolina at Charlotte","ror":"https://ror.org/04dawnj30","country_code":"US","type":"education","lineage":["https://openalex.org/I102149020"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ning Zhou","raw_affiliation_strings":["Department of Computer Science, UNC-Charlotte, NC, USA","Department of Computer Science, UNC-Charlotte, NC28223, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, UNC-Charlotte, NC, USA","institution_ids":["https://openalex.org/I102149020"]},{"raw_affiliation_string":"Department of Computer Science, UNC-Charlotte, NC28223, USA#TAB#","institution_ids":["https://openalex.org/I102149020"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102148168","display_name":"Yuli Gao","orcid":null},"institutions":[{"id":"https://openalex.org/I1324840837","display_name":"Hewlett-Packard (United States)","ror":"https://ror.org/059rn9488","country_code":"US","type":"company","lineage":["https://openalex.org/I1324840837"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yuli Gao","raw_affiliation_strings":["Multimedia Interaction and Understanding, HP Laboratories, Palo Alto, CA, USA","Multimedia Interaction and Understanding, HP Labs, Palo Alto, CA94304, USA"],"affiliations":[{"raw_affiliation_string":"Multimedia Interaction and Understanding, HP Laboratories, Palo Alto, CA, USA","institution_ids":["https://openalex.org/I1324840837"]},{"raw_affiliation_string":"Multimedia Interaction and Understanding, HP Labs, Palo Alto, CA94304, USA","institution_ids":["https://openalex.org/I1324840837"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100728564"],"corresponding_institution_ids":["https://openalex.org/I102149020"],"apc_list":null,"apc_paid":null,"fwci":8.7291,"has_fulltext":false,"cited_by_count":48,"citation_normalized_percentile":{"value":0.98132358,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"802","last_page":"809"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8101938366889954},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6390159130096436},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5602700114250183},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.554772675037384},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5390915274620056},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4364648759365082},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4308854937553406},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4138428568840027},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.41208183765411377},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.39890599250793457}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8101938366889954},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6390159130096436},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5602700114250183},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.554772675037384},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5390915274620056},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4364648759365082},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4308854937553406},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4138428568840027},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.41208183765411377},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.39890599250793457},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvpr.2010.5540135","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2010.5540135","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE Computer Society Conference on Computer Vision and Pattern Recognition","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1578226009","https://openalex.org/W2023170106","https://openalex.org/W2071497990","https://openalex.org/W2080289064","https://openalex.org/W2098020658","https://openalex.org/W2112020727","https://openalex.org/W2113858169","https://openalex.org/W2121947440","https://openalex.org/W2123053055","https://openalex.org/W2130660124","https://openalex.org/W2134135198","https://openalex.org/W2134737843","https://openalex.org/W2145607950","https://openalex.org/W2149056056","https://openalex.org/W2170146448","https://openalex.org/W3070706509","https://openalex.org/W6634576794","https://openalex.org/W6677945368"],"related_works":["https://openalex.org/W2787993192","https://openalex.org/W2375480909","https://openalex.org/W2158269427","https://openalex.org/W4381280689","https://openalex.org/W3033859939","https://openalex.org/W2353314428","https://openalex.org/W2847365777","https://openalex.org/W2012019886","https://openalex.org/W3128025644","https://openalex.org/W2355048207"],"abstract_inverted_index":{"To":[0],"leverage":[1],"large-scale":[2,113],"weakly-tagged":[3,31,114],"images":[4,32,40,59,87,105],"for":[5,28,47,127],"computer":[6,129],"vision":[7,130],"tasks":[8],"(such":[9],"as":[10],"object":[11],"detection":[12],"and":[13,21,33,41,60,77,81,88],"scene":[14],"recognition),":[15],"a":[16],"novel":[17],"cross-modal":[18],"tag":[19],"cleansing":[20,29],"junk":[22],"image":[23],"filtering":[24],"algorithm":[25,69],"is":[26],"developed":[27],"the":[30,43,53,58,61,72,83,86],"their":[34,66,89],"social":[35,90],"tags":[36,46,91],"(i.e.,":[37],"removing":[38],"irrelevant":[39],"finding":[42],"most":[44],"relevant":[45],"each":[48],"image)":[49],"by":[50,110],"integrating":[51],"both":[52],"visual":[54],"similarity":[55,63],"contexts":[56,64],"between":[57,65,85],"semantic":[62],"tags.":[67],"Our":[68],"can":[70,96,117],"address":[71],"issues":[73],"of":[74,103],"spams,":[75],"polysemes":[76],"synonyms":[78],"more":[79,92,107,123],"effectively":[80],"determine":[82],"relevance":[84],"precisely,":[93],"thus":[94],"it":[95],"allow":[97],"us":[98],"to":[99,121],"create":[100],"large":[101],"amounts":[102],"training":[104,126],"with":[106],"reliable":[108],"labels":[109],"harvesting":[111],"from":[112],"images,":[115],"which":[116],"further":[118],"be":[119],"used":[120],"achieve":[122],"effective":[124],"classifier":[125],"many":[128],"tasks.":[131]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":5},{"year":2014,"cited_by_count":7},{"year":2013,"cited_by_count":9},{"year":2012,"cited_by_count":8}],"updated_date":"2026-03-25T13:04:00.132906","created_date":"2025-10-10T00:00:00"}
